~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/check.py

  • Committer: Robert Collins
  • Date: 2005-10-03 02:10:02 UTC
  • mto: (1393.1.30)
  • mto: This revision was merged to the branch mainline in revision 1400.
  • Revision ID: robertc@robertcollins.net-20051003021002-4bf750e1d2bf7149
move checks for versionability of file kinds into InventoryEntry

Show diffs side-by-side

added added

removed removed

Lines of Context:
25
25
# TODO: Check revision, inventory and entry objects have all 
26
26
# required fields.
27
27
 
28
 
# TODO: Get every revision in the revision-store even if they're not
29
 
# referenced by history and make sure they're all valid.
30
28
 
31
29
import bzrlib.ui
32
30
from bzrlib.trace import note, warning
34
32
from bzrlib.trace import mutter
35
33
from bzrlib.errors import BzrCheckError, NoSuchRevision
36
34
from bzrlib.inventory import ROOT_ID
 
35
from bzrlib.branch import gen_root_id
37
36
 
38
37
 
39
38
class Check(object):
40
39
    """Check a branch"""
41
 
 
42
40
    def __init__(self, branch):
43
41
        self.branch = branch
 
42
        branch.lock_read()
 
43
        try:
 
44
            branch.weave_store.enable_cache = True
 
45
            branch.control_weaves.enable_cache = True
 
46
            self.run()
 
47
        finally:
 
48
            branch.unlock()
 
49
            branch.weave_store.enable_cache = False
 
50
            branch.control_weaves.enable_cache = False
 
51
 
 
52
 
 
53
    def run(self):
 
54
        branch = self.branch
 
55
 
 
56
 
44
57
        self.checked_text_cnt = 0
45
58
        self.checked_rev_cnt = 0
46
 
        self.ghosts = []
47
59
        self.repeated_text_cnt = 0
48
 
        self.missing_parent_links = {}
49
60
        self.missing_inventory_sha_cnt = 0
50
61
        self.missing_revision_cnt = 0
51
62
        # maps (file-id, version) -> sha1
52
63
        self.checked_texts = {}
53
64
 
54
 
    def check(self):
55
 
        self.branch.lock_read()
 
65
        history = branch.revision_history()
 
66
        revno = 0
 
67
        revcount = len(history)
 
68
 
 
69
        last_rev_id = None
56
70
        self.progress = bzrlib.ui.ui_factory.progress_bar()
57
 
        try:
58
 
            self.progress.update('retrieving inventory', 0, 0)
59
 
            # do not put in init, as it should be done with progess,
60
 
            # and inside the lock.
61
 
            self.inventory_weave = self.branch._get_inventory_weave()
62
 
            self.history = self.branch.revision_history()
63
 
            if not len(self.history):
64
 
                # nothing to see here
65
 
                return
66
 
            self.plan_revisions()
67
 
            revno = 0
68
 
            while revno < len(self.planned_revisions):
69
 
                rev_id = self.planned_revisions[revno]
70
 
                self.progress.update('checking revision', revno,
71
 
                                     len(self.planned_revisions))
72
 
                revno += 1
73
 
                self.check_one_rev(rev_id)
74
 
        finally:
75
 
            self.progress.clear()
76
 
            self.branch.unlock()
77
 
 
78
 
    def plan_revisions(self):
79
 
        if not self.branch.revision_store.listable():
80
 
            self.planned_revisions = self.branch.get_ancestry(self.history[-1])
81
 
            self.planned_revisions.remove(None)
82
 
            # FIXME progress bars should support this more nicely.
83
 
            self.progress.clear()
84
 
            print ("Checking reachable history -"
85
 
                   " for a complete check use a local branch.")
86
 
            return
87
 
        
88
 
        self.planned_revisions = set(self.branch.revision_store)
89
 
        inventoried = set(self.inventory_weave.names())
90
 
        awol = self.planned_revisions - inventoried
91
 
        if len(awol) > 0:
92
 
            raise BzrCheckError('Stored revisions missing from inventory'
93
 
                '{%s}' % ','.join([f for f in awol]))
94
 
        self.planned_revisions = list(self.planned_revisions)
95
 
 
96
 
    def report_results(self, verbose):
 
71
        for rev_id in history:
 
72
            self.progress.update('checking revision', revno, revcount)
 
73
            revno += 1
 
74
            self.check_one_rev(rev_id, last_rev_id)
 
75
            last_rev_id = rev_id
 
76
        self.progress.clear()
 
77
        self.report_results()
 
78
 
 
79
 
 
80
    def report_results(self):
97
81
        note('checked branch %s format %d',
98
82
             self.branch.base, 
99
83
             self.branch._branch_format)
102
86
        note('%6d unique file texts', self.checked_text_cnt)
103
87
        note('%6d repeated file texts', self.repeated_text_cnt)
104
88
        if self.missing_inventory_sha_cnt:
105
 
            note('%6d revisions are missing inventory_sha1',
 
89
            note('%d revisions are missing inventory_sha1',
106
90
                 self.missing_inventory_sha_cnt)
107
91
        if self.missing_revision_cnt:
108
 
            note('%6d revisions are mentioned but not present',
 
92
            note('%d revisions are mentioned but not present',
109
93
                 self.missing_revision_cnt)
110
 
        if len(self.ghosts):
111
 
            note('%6d ghost revisions', len(self.ghosts))
112
 
            if verbose:
113
 
                for ghost in self.ghosts:
114
 
                    note('      %s', ghost)
115
 
        if len(self.missing_parent_links):
116
 
            note('%6d revisions missing parents in ancestry', 
117
 
                 len(self.missing_parent_links))
118
 
            if verbose:
119
 
                for link, linkers in self.missing_parent_links.items():
120
 
                    note('      %s should be in the ancestry for:', link)
121
 
                    for linker in linkers:
122
 
                        note('       * %s', linker)
123
 
 
124
 
    def check_one_rev(self, rev_id):
 
94
 
 
95
 
 
96
    def check_one_rev(self, rev_id, last_rev_id):
125
97
        """Check one revision.
126
98
 
127
99
        rev_id - the one to check
129
101
        last_rev_id - the previous one on the mainline, if any.
130
102
        """
131
103
 
132
 
        # mutter('    revision {%s}', rev_id)
 
104
        # mutter('    revision {%s}' % rev_id)
133
105
        branch = self.branch
134
 
        try:
135
 
            rev_history_position = self.history.index(rev_id)
136
 
        except ValueError:
137
 
            rev_history_position = None
138
 
        last_rev_id = None
139
 
        if rev_history_position:
140
 
            rev = branch.get_revision(rev_id)
141
 
            if rev_history_position > 0:
142
 
                last_rev_id = self.history[rev_history_position - 1]
143
 
        else:
144
 
            rev = branch.get_revision(rev_id)
145
 
                
 
106
        rev = branch.get_revision(rev_id)
146
107
        if rev.revision_id != rev_id:
147
108
            raise BzrCheckError('wrong internal revision id in revision {%s}'
148
109
                                % rev_id)
149
110
 
150
111
        # check the previous history entry is a parent of this entry
151
112
        if rev.parent_ids:
152
 
            if last_rev_id is not None:
153
 
                for parent_id in rev.parent_ids:
154
 
                    if parent_id == last_rev_id:
155
 
                        break
156
 
                else:
157
 
                    raise BzrCheckError("previous revision {%s} not listed among "
158
 
                                        "parents of {%s}"
159
 
                                        % (last_rev_id, rev_id))
160
 
            for parent in rev.parent_ids:
161
 
                if not parent in self.planned_revisions:
162
 
                    missing_links = self.missing_parent_links.get(parent, [])
163
 
                    missing_links.append(rev_id)
164
 
                    self.missing_parent_links[parent] = missing_links
165
 
                    # list based so somewhat slow,
166
 
                    # TODO have a planned_revisions list and set.
167
 
                    if self.branch.has_revision(parent):
168
 
                        missing_ancestry = self.branch.get_ancestry(parent)
169
 
                        for missing in missing_ancestry:
170
 
                            if (missing is not None 
171
 
                                and missing not in self.planned_revisions):
172
 
                                self.planned_revisions.append(missing)
173
 
                    else:
174
 
                        self.ghosts.append(rev_id)
 
113
            if last_rev_id is None:
 
114
                raise BzrCheckError("revision {%s} has %d parents, but is the "
 
115
                                    "start of the branch"
 
116
                                    % (rev_id, len(rev.parent_ids)))
 
117
            for parent_id in rev.parent_ids:
 
118
                if parent_id == last_rev_id:
 
119
                    break
 
120
            else:
 
121
                raise BzrCheckError("previous revision {%s} not listed among "
 
122
                                    "parents of {%s}"
 
123
                                    % (last_rev_id, rev_id))
175
124
        elif last_rev_id:
176
125
            raise BzrCheckError("revision {%s} has no parents listed "
177
126
                                "but preceded by {%s}"
184
133
                    ' value in revision {%s}' % rev_id)
185
134
        else:
186
135
            missing_inventory_sha_cnt += 1
187
 
            mutter("no inventory_sha1 on revision {%s}", rev_id)
 
136
            mutter("no inventory_sha1 on revision {%s}" % rev_id)
188
137
        self._check_revision_tree(rev_id)
189
138
        self.checked_rev_cnt += 1
190
139
 
210
159
            seen_names[path] = True
211
160
 
212
161
 
213
 
def check(branch, verbose):
 
162
def check(branch):
214
163
    """Run consistency checks on a branch."""
215
 
    checker = Check(branch)
216
 
    checker.check()
217
 
    checker.report_results(verbose)
 
164
    Check(branch)