bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
| 
1
by mbp at sourcefrog
 import from baz patch-364  | 
1  | 
# Copyright (C) 2004, 2005 by Martin Pool
 | 
2  | 
# Copyright (C) 2005 by Canonical Ltd
 | 
|
3  | 
||
4  | 
# This program is free software; you can redistribute it and/or modify
 | 
|
5  | 
# it under the terms of the GNU General Public License as published by
 | 
|
6  | 
# the Free Software Foundation; either version 2 of the License, or
 | 
|
7  | 
# (at your option) any later version.
 | 
|
8  | 
||
9  | 
# This program is distributed in the hope that it will be useful,
 | 
|
10  | 
# but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
|
11  | 
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
|
12  | 
# GNU General Public License for more details.
 | 
|
13  | 
||
14  | 
# You should have received a copy of the GNU General Public License
 | 
|
15  | 
# along with this program; if not, write to the Free Software
 | 
|
16  | 
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 | 
|
17  | 
||
| 
1335
by Martin Pool
 doc  | 
18  | 
# TODO: Check ancestries are correct for every revision: includes
 | 
19  | 
# every revision committed so far, and in a reasonable order.
 | 
|
20  | 
||
| 
1347
by Martin Pool
 - refactor check code into method object  | 
21  | 
# TODO: Also check non-mainline revisions mentioned as parents.
 | 
22  | 
||
23  | 
# TODO: Check for extra files in the control directory.
 | 
|
24  | 
||
| 
1348
by Martin Pool
 - more refactoring of check code  | 
25  | 
# TODO: Check revision, inventory and entry objects have all 
 | 
26  | 
# required fields.
 | 
|
27  | 
||
| 
1185.16.101
by mbp at sourcefrog
 todo  | 
28  | 
# TODO: Get every revision in the revision-store even if they're not
 | 
29  | 
# referenced by history and make sure they're all valid.
 | 
|
| 
1347
by Martin Pool
 - refactor check code into method object  | 
30  | 
|
| 
1104
by Martin Pool
 - Add a simple UIFactory  | 
31  | 
import bzrlib.ui  | 
| 
1130
by Martin Pool
 - check command writes output through logging not direct  | 
32  | 
from bzrlib.trace import note, warning  | 
| 
1092.2.20
by Robert Collins
 symlink and weaves, whaddya know  | 
33  | 
from bzrlib.osutils import rename, sha_string, fingerprint_file  | 
| 
1346
by Martin Pool
 - remove dead code from bzrlib.check  | 
34  | 
from bzrlib.trace import mutter  | 
35  | 
from bzrlib.errors import BzrCheckError, NoSuchRevision  | 
|
36  | 
from bzrlib.inventory import ROOT_ID  | 
|
| 
1
by mbp at sourcefrog
 import from baz patch-364  | 
37  | 
|
| 
1104
by Martin Pool
 - Add a simple UIFactory  | 
38  | 
|
| 
1347
by Martin Pool
 - refactor check code into method object  | 
39  | 
class Check(object):
    """Check a branch.

    Usage: construct with a branch, call check() to run the checks, then
    report_results() to log a summary of the counters gathered.
    """

    def __init__(self, branch):
        """Set up empty counters for a check of `branch`.

        No repository data is read here; that happens in check(), inside
        the read lock.
        """
        self.branch = branch
        self.repository = branch.repository
        self.checked_text_cnt = 0
        self.checked_rev_cnt = 0
        # ids of revisions that name a parent the branch does not have
        self.ghosts = []
        self.repeated_text_cnt = 0
        # maps parent revision id -> list of revision ids that name it as
        # a parent although it was not among the planned revisions
        self.missing_parent_links = {}
        self.missing_inventory_sha_cnt = 0
        self.missing_revision_cnt = 0
        # maps (file-id, version) -> sha1
        self.checked_texts = {}
        # maps weave id -> True for every weave that passed its check
        self.checked_weaves = {}

    def check(self):
        """Run every check while holding a read lock on the branch.

        Returns early, having checked nothing, when the branch has no
        revision history.  Problems are reported by raising BzrCheckError
        from the individual checks.
        """
        self.branch.lock_read()
        try:
            self.progress = bzrlib.ui.ui_factory.progress_bar()
            try:
                self.progress.update('retrieving inventory', 0, 0)
                # do not put in init, as it should be done with progress,
                # and inside the lock.
                self.inventory_weave = \
                    self.branch.repository.get_inventory_weave()
                self.history = self.branch.revision_history()
                if not len(self.history):
                    # nothing to see here
                    return
                self.plan_revisions()
                revno = 0
                self.check_weaves()
                # check_one_rev may append to planned_revisions, so the
                # length has to be re-read on every iteration.
                while revno < len(self.planned_revisions):
                    rev_id = self.planned_revisions[revno]
                    self.progress.update('checking revision', revno,
                                         len(self.planned_revisions))
                    revno += 1
                    self.check_one_rev(rev_id)
            finally:
                self.progress.clear()
        finally:
            # Nested so the lock is released even if creating or clearing
            # the progress bar fails.
            self.branch.unlock()

    def plan_revisions(self):
        """Fill self.planned_revisions with the revision ids to check.

        When the revision store cannot be listed, only the ancestry of
        the last revision in the history is planned.  Otherwise every
        stored revision is planned.

        Raises BzrCheckError if a stored revision is missing from the
        inventory weave.
        """
        repository = self.branch.repository
        if not repository.revision_store.listable():
            self.planned_revisions = repository.get_ancestry(self.history[-1])
            self.planned_revisions.remove(None)
            # FIXME progress bars should support this more nicely.
            self.progress.clear()
            print("Checking reachable history -"
                  " for a complete check use a local branch.")
            return

        self.planned_revisions = set(repository.revision_store)
        inventoried = set(self.inventory_weave.names())
        awol = self.planned_revisions - inventoried
        if len(awol) > 0:
            raise BzrCheckError('Stored revisions missing from inventory'
                                '{%s}' % ','.join(awol))
        self.planned_revisions = list(self.planned_revisions)

    def report_results(self, verbose):
        """Log a summary of the counters gathered by check().

        verbose - when true, also list each ghost and each missing parent
        link individually.
        """
        note('checked branch %s format %s',
             self.branch.base,
             self.branch._format)

        note('%6d revisions', self.checked_rev_cnt)
        note('%6d unique file texts', self.checked_text_cnt)
        note('%6d repeated file texts', self.repeated_text_cnt)
        note('%6d weaves', len(self.checked_weaves))
        if self.missing_inventory_sha_cnt:
            note('%6d revisions are missing inventory_sha1',
                 self.missing_inventory_sha_cnt)
        if self.missing_revision_cnt:
            note('%6d revisions are mentioned but not present',
                 self.missing_revision_cnt)
        if len(self.ghosts):
            note('%6d ghost revisions', len(self.ghosts))
            if verbose:
                for ghost in self.ghosts:
                    note(' %s', ghost)
        if len(self.missing_parent_links):
            note('%6d revisions missing parents in ancestry',
                 len(self.missing_parent_links))
            if verbose:
                for link, linkers in self.missing_parent_links.items():
                    note(' %s should be in the ancestry for:', link)
                    for linker in linkers:
                        note(' * %s', linker)

    def check_one_rev(self, rev_id):
        """Check one revision.

        rev_id - the one to check

        The previous mainline revision, if any, is looked up from
        self.history and must be listed among the parents of rev_id.

        Raises BzrCheckError on a wrong internal revision id, a mainline
        predecessor that is not a parent, or an inventory sha1 mismatch.
        """
        # mutter('    revision {%s}', rev_id)
        branch = self.branch
        try:
            rev_history_position = self.history.index(rev_id)
        except ValueError:
            rev_history_position = None
        rev = branch.repository.get_revision(rev_id)
        last_rev_id = None
        # Position 0 (first in history) and None (not in history) both
        # mean there is no mainline predecessor.
        if rev_history_position:
            last_rev_id = self.history[rev_history_position - 1]

        if rev.revision_id != rev_id:
            raise BzrCheckError('wrong internal revision id in revision {%s}'
                                % rev_id)

        # check the previous history entry is a parent of this entry
        if rev.parent_ids:
            if (last_rev_id is not None
                    and last_rev_id not in rev.parent_ids):
                raise BzrCheckError("previous revision {%s} not listed among "
                                    "parents of {%s}"
                                    % (last_rev_id, rev_id))
            for parent in rev.parent_ids:
                if parent not in self.planned_revisions:
                    self.missing_parent_links.setdefault(
                        parent, []).append(rev_id)
                    # list based so somewhat slow,
                    # TODO have a planned_revisions list and set.
                    if self.branch.has_revision(parent):
                        # Queue the parent's ancestry so the loop in
                        # check() gets to it as well.
                        missing_ancestry = self.repository.get_ancestry(parent)
                        for missing in missing_ancestry:
                            if (missing is not None
                                    and missing not in self.planned_revisions):
                                self.planned_revisions.append(missing)
                    else:
                        self.ghosts.append(rev_id)
        elif last_rev_id:
            raise BzrCheckError("revision {%s} has no parents listed "
                                "but preceded by {%s}"
                                % (rev_id, last_rev_id))

        if rev.inventory_sha1:
            inv_sha1 = branch.repository.get_inventory_sha1(rev_id)
            if inv_sha1 != rev.inventory_sha1:
                raise BzrCheckError('Inventory sha1 hash doesn\'t match'
                                    ' value in revision {%s}' % rev_id)
        else:
            # The counter lives on the instance; a bare local name here
            # would raise UnboundLocalError.
            self.missing_inventory_sha_cnt += 1
            mutter("no inventory_sha1 on revision {%s}", rev_id)
        self._check_revision_tree(rev_id)
        self.checked_rev_cnt += 1

    def check_weaves(self):
        """Check all the weaves we can get our hands on.

        The inventory weave is always checked.  The weaves in the weave
        store are checked only when that store can be listed.
        """
        n_weaves = 1
        weave_ids = []
        if self.branch.repository.weave_store.listable():
            weave_ids = list(self.branch.repository.weave_store)
            n_weaves = len(weave_ids)
        self.progress.update('checking weave', 0, n_weaves)
        self.inventory_weave.check(progress_bar=self.progress)
        for i, weave_id in enumerate(weave_ids):
            self.progress.update('checking weave', i, n_weaves)
            w = self.branch.repository.weave_store.get_weave(
                weave_id, self.branch.repository.get_transaction())
            # No progress here, because it looks ugly.
            w.check()
            self.checked_weaves[weave_id] = True

    def _check_revision_tree(self, rev_id):
        """Check the inventory of the tree for revision `rev_id`.

        Raises BzrCheckError on a duplicated file id or duplicated path.
        Each inventory entry is also asked to check itself and is handed
        this checker object.
        """
        tree = self.branch.repository.revision_tree(rev_id)
        inv = tree.inventory
        seen_ids = {}
        for file_id in inv:
            if file_id in seen_ids:
                raise BzrCheckError('duplicated file_id {%s} '
                                    'in inventory for revision {%s}'
                                    % (file_id, rev_id))
            seen_ids[file_id] = True
        for file_id in inv:
            ie = inv[file_id]
            ie.check(self, rev_id, inv, tree)
        seen_names = {}
        for path, ie in inv.iter_entries():
            if path in seen_names:
                raise BzrCheckError('duplicated path %s '
                                    'in inventory for revision {%s}'
                                    % (path, rev_id))
            seen_names[path] = True
|
| 
1349
by Martin Pool
 - more refactoring of check code  | 
234  | 
|
| 
1347
by Martin Pool
 - refactor check code into method object  | 
235  | 
|
| 
1449
by Robert Collins
 teach check about ghosts  | 
236  | 
def check(branch, verbose):
    """Run consistency checks on a branch.

    branch - the branch to check

    verbose - passed through to Check.report_results
    """
    branch_checker = Check(branch)
    branch_checker.check()
    branch_checker.report_results(verbose)