19
15
# along with this program; if not, write to the Free Software
20
16
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
24
######################################################################
28
"""Consistency check of tree."""
30
mutter("checking tree")
32
check_patch_chaining()
33
check_patch_uniqueness()
35
mutter("tree looks OK")
36
## TODO: Check that previous-inventory and previous-manifest
37
## are the same as those stored in the previous changeset.
39
## TODO: Check all patches present in patch directory are
40
## mentioned in patch history; having an orphaned patch only gives
43
## TODO: Check cached data is consistent with data reconstructed
46
## TODO: Check no control files are versioned.
48
## TODO: Check that the before-hash of each file in a later
49
## revision matches the after-hash in the previous revision to
53
def check_inventory():
54
mutter("checking inventory file and ids...")
58
for l in controlfile('inventory').readlines():
61
bailout("malformed inventory line: " + `l`)
64
if file_id in seen_ids:
65
bailout("duplicated file id " + file_id)
68
if name in seen_names:
69
bailout("duplicated file name in inventory: " + quotefn(name))
72
if is_control_file(name):
73
raise BzrError("control file %s present in inventory" % quotefn(name))
76
def check_patches_exist():
    """Verify that every patch named in the revision history is readable.

    Walks the ids returned by revision_history() and reads the patch
    header for each one; the returned headers are discarded.
    """
    mutter("checking all patches are present...")
    for patch_id in revision_history():
        read_patch_header(patch_id)
83
def check_patch_chaining():
84
"""Check ancestry of patches and history file is consistent"""
85
mutter("checking patch chaining...")
87
for pid in revision_history():
88
log_prev = read_patch_header(pid).precursor
90
bailout("inconsistent precursor links on " + pid)
94
def check_patch_uniqueness():
95
"""Make sure no patch is listed twice in the history.
97
This should be implied by having correct ancestry but I'll check it
99
mutter("checking history for duplicates...")
101
for pid in revision_history():
103
bailout("patch " + pid + " appears twice in history")
18
# TODO: Check ancestries are correct for every revision: includes
19
# every revision committed so far, and in a reasonable order.
21
# TODO: Also check non-mainline revisions mentioned as parents.
23
# TODO: Check for extra files in the control directory.
25
# TODO: Check revision, inventory and entry objects have all
30
from bzrlib.trace import note, warning
31
from bzrlib.osutils import rename, sha_string, fingerprint_file, sha_strings
32
from bzrlib.trace import mutter
33
from bzrlib.errors import BzrCheckError, NoSuchRevision
34
from bzrlib.inventory import ROOT_ID
35
from bzrlib.branch import gen_root_id
40
def __init__(self, branch):
44
branch.weave_store.enable_cache = True
45
branch.control_weaves.enable_cache = True
49
branch.weave_store.enable_cache = False
50
branch.control_weaves.enable_cache = False
57
self.checked_text_cnt = 0
58
self.checked_rev_cnt = 0
59
self.repeated_text_cnt = 0
60
self.missing_inventory_sha_cnt = 0
61
self.missing_revision_cnt = 0
62
# maps (file-id, version) -> sha1
63
self.checked_texts = {}
65
history = branch.revision_history()
67
revcount = len(history)
70
self.progress = bzrlib.ui.ui_factory.progress_bar()
71
for rev_id in history:
72
self.progress.update('checking revision', revno, revcount)
74
self.check_one_rev(rev_id, last_rev_id)
80
def report_results(self):
# Summarise the check through note(): the branch format, then the counts
# of revisions checked, unique file texts and repeated file texts.
# NOTE(review): the first format string has two placeholders (%s and %d)
# but only self.branch._branch_format is visible as an argument -- confirm
# that the value for %s is actually passed.
81
note('checked branch %s format %d',
83
self.branch._branch_format)
85
note('%6d revisions', self.checked_rev_cnt)
86
note('%6d unique file texts', self.checked_text_cnt)
87
note('%6d repeated file texts', self.repeated_text_cnt)
88
# The two problem counters below are reported only when non-zero.
if self.missing_inventory_sha_cnt:
89
note('%d revisions are missing inventory_sha1',
90
self.missing_inventory_sha_cnt)
91
if self.missing_revision_cnt:
92
note('%d revisions are mentioned but not present',
93
self.missing_revision_cnt)
96
def check_one_rev(self, rev_id, last_rev_id):
97
"""Check one revision.
99
rev_id - the one to check
101
last_rev_id - the previous one on the mainline, if any.
104
# mutter(' revision {%s}' % rev_id)
106
rev = branch.get_revision(rev_id)
107
if rev.revision_id != rev_id:
108
raise BzrCheckError('wrong internal revision id in revision {%s}'
111
# check the previous history entry is a parent of this entry
113
if last_rev_id is None:
114
raise BzrCheckError("revision {%s} has %d parents, but is the "
115
"start of the branch"
116
% (rev_id, len(rev.parent_ids)))
117
for parent_id in rev.parent_ids:
118
if parent_id == last_rev_id:
121
raise BzrCheckError("previous revision {%s} not listed among "
123
% (last_rev_id, rev_id))
125
raise BzrCheckError("revision {%s} has no parents listed "
126
"but preceded by {%s}"
127
% (rev_id, last_rev_id))
129
if rev.inventory_sha1:
130
inv_sha1 = branch.get_inventory_sha1(rev_id)
131
if inv_sha1 != rev.inventory_sha1:
132
raise BzrCheckError('Inventory sha1 hash doesn\'t match'
133
' value in revision {%s}' % rev_id)
135
# Tally on the instance: a bare name here would be an unbound local, and
# the counter is initialised and reported as self.missing_inventory_sha_cnt.
self.missing_inventory_sha_cnt += 1
136
mutter("no inventory_sha1 on revision {%s}" % rev_id)
137
self._check_revision_tree(rev_id)
138
self.checked_rev_cnt += 1
140
def _check_revision_tree(self, rev_id):
141
tree = self.branch.revision_tree(rev_id)
145
if file_id in seen_ids:
146
raise BzrCheckError('duplicated file_id {%s} '
147
'in inventory for revision {%s}'
149
seen_ids[file_id] = True
151
self._check_one_entry(rev_id, inv, tree, file_id)
153
for path, ie in inv.iter_entries():
154
if path in seen_names:
155
raise BzrCheckError('duplicated path %s '
156
'in inventory for revision {%s}'
158
seen_names[path] = True
161
def _check_one_entry(self, rev_id, inv, tree, file_id):
163
if ie.parent_id != None:
164
if not inv.has_id(ie.parent_id):
165
raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'
166
% (ie.parent_id, rev_id))
167
if ie.kind == 'file':
168
text_version = ie.text_version
169
t = (file_id, text_version)
170
if t in self.checked_texts:
171
prev_sha = self.checked_texts[t]
172
if prev_sha != ie.text_sha1:
173
raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %
176
self.repeated_text_cnt += 1
178
mutter('check version {%s} of {%s}', rev_id, file_id)
179
file_lines = tree.get_file_lines(file_id)
180
self.checked_text_cnt += 1
181
if ie.text_size != sum(map(len, file_lines)):
182
raise BzrCheckError('text {%s} wrong size' % ie.text_id)
183
if ie.text_sha1 != sha_strings(file_lines):
184
raise BzrCheckError('text {%s} wrong sha1' % ie.text_id)
185
self.checked_texts[t] = ie.text_sha1
186
elif ie.kind == 'directory':
187
if ie.text_sha1 != None or ie.text_size != None or ie.text_id != None:
188
raise BzrCheckError('directory {%s} has text in revision {%s}'
190
elif ie.kind == 'root_directory':
193
raise BzrCheckError('unknown entry kind %r in revision {%s}' %
198
"""Run consistency checks on a branch."""