##// END OF EJS Templates
verify: call ui.progress()
Augie Fackler -
r10433:767fbacb default
parent child Browse files
Show More
@@ -1,279 +1,298 b''
1 # verify.py - repository integrity checking for Mercurial
1 # verify.py - repository integrity checking for Mercurial
2 #
2 #
3 # Copyright 2006, 2007 Matt Mackall <mpm@selenic.com>
3 # Copyright 2006, 2007 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from node import nullid, short
8 from node import nullid, short
9 from i18n import _
9 from i18n import _
10 import os
10 import os
11 import revlog, util, error
11 import revlog, util, error
12
12
def verify(repo):
    """Run the integrity check on repo while holding the repository lock.

    The lock obtained from repo.lock() is released whether _verify()
    returns normally or raises. The value returned by _verify() is
    passed back to the caller unchanged.
    """
    repolock = repo.lock()
    try:
        result = _verify(repo)
    finally:
        repolock.release()
    return result
19
19
20 def _verify(repo):
20 def _verify(repo):
21 mflinkrevs = {}
21 mflinkrevs = {}
22 filelinkrevs = {}
22 filelinkrevs = {}
23 filenodes = {}
23 filenodes = {}
24 revisions = 0
24 revisions = 0
25 badrevs = set()
25 badrevs = set()
26 errors = [0]
26 errors = [0]
27 warnings = [0]
27 warnings = [0]
28 ui = repo.ui
28 ui = repo.ui
29 cl = repo.changelog
29 cl = repo.changelog
30 mf = repo.manifest
30 mf = repo.manifest
31 lrugetctx = util.lrucachefunc(repo.changectx)
31 lrugetctx = util.lrucachefunc(repo.changectx)
32
32
33 if not repo.cancopy():
33 if not repo.cancopy():
34 raise util.Abort(_("cannot verify bundle or remote repos"))
34 raise util.Abort(_("cannot verify bundle or remote repos"))
35
35
36 def err(linkrev, msg, filename=None):
36 def err(linkrev, msg, filename=None):
37 if linkrev != None:
37 if linkrev != None:
38 badrevs.add(linkrev)
38 badrevs.add(linkrev)
39 else:
39 else:
40 linkrev = '?'
40 linkrev = '?'
41 msg = "%s: %s" % (linkrev, msg)
41 msg = "%s: %s" % (linkrev, msg)
42 if filename:
42 if filename:
43 msg = "%s@%s" % (filename, msg)
43 msg = "%s@%s" % (filename, msg)
44 ui.warn(" " + msg + "\n")
44 ui.warn(" " + msg + "\n")
45 errors[0] += 1
45 errors[0] += 1
46
46
47 def exc(linkrev, msg, inst, filename=None):
47 def exc(linkrev, msg, inst, filename=None):
48 if isinstance(inst, KeyboardInterrupt):
48 if isinstance(inst, KeyboardInterrupt):
49 ui.warn(_("interrupted"))
49 ui.warn(_("interrupted"))
50 raise
50 raise
51 err(linkrev, "%s: %s" % (msg, inst), filename)
51 err(linkrev, "%s: %s" % (msg, inst), filename)
52
52
53 def warn(msg):
53 def warn(msg):
54 ui.warn(msg + "\n")
54 ui.warn(msg + "\n")
55 warnings[0] += 1
55 warnings[0] += 1
56
56
57 def checklog(obj, name, linkrev):
57 def checklog(obj, name, linkrev):
58 if not len(obj) and (havecl or havemf):
58 if not len(obj) and (havecl or havemf):
59 err(linkrev, _("empty or missing %s") % name)
59 err(linkrev, _("empty or missing %s") % name)
60 return
60 return
61
61
62 d = obj.checksize()
62 d = obj.checksize()
63 if d[0]:
63 if d[0]:
64 err(None, _("data length off by %d bytes") % d[0], name)
64 err(None, _("data length off by %d bytes") % d[0], name)
65 if d[1]:
65 if d[1]:
66 err(None, _("index contains %d extra bytes") % d[1], name)
66 err(None, _("index contains %d extra bytes") % d[1], name)
67
67
68 if obj.version != revlog.REVLOGV0:
68 if obj.version != revlog.REVLOGV0:
69 if not revlogv1:
69 if not revlogv1:
70 warn(_("warning: `%s' uses revlog format 1") % name)
70 warn(_("warning: `%s' uses revlog format 1") % name)
71 elif revlogv1:
71 elif revlogv1:
72 warn(_("warning: `%s' uses revlog format 0") % name)
72 warn(_("warning: `%s' uses revlog format 0") % name)
73
73
74 def checkentry(obj, i, node, seen, linkrevs, f):
74 def checkentry(obj, i, node, seen, linkrevs, f):
75 lr = obj.linkrev(obj.rev(node))
75 lr = obj.linkrev(obj.rev(node))
76 if lr < 0 or (havecl and lr not in linkrevs):
76 if lr < 0 or (havecl and lr not in linkrevs):
77 if lr < 0 or lr >= len(cl):
77 if lr < 0 or lr >= len(cl):
78 msg = _("rev %d points to nonexistent changeset %d")
78 msg = _("rev %d points to nonexistent changeset %d")
79 else:
79 else:
80 msg = _("rev %d points to unexpected changeset %d")
80 msg = _("rev %d points to unexpected changeset %d")
81 err(None, msg % (i, lr), f)
81 err(None, msg % (i, lr), f)
82 if linkrevs:
82 if linkrevs:
83 if f and len(linkrevs) > 1:
83 if f and len(linkrevs) > 1:
84 try:
84 try:
85 # attempt to filter down to real linkrevs
85 # attempt to filter down to real linkrevs
86 linkrevs = [l for l in linkrevs
86 linkrevs = [l for l in linkrevs
87 if lrugetctx(l)[f].filenode() == node]
87 if lrugetctx(l)[f].filenode() == node]
88 except:
88 except:
89 pass
89 pass
90 warn(_(" (expected %s)") % " ".join(map(str, linkrevs)))
90 warn(_(" (expected %s)") % " ".join(map(str, linkrevs)))
91 lr = None # can't be trusted
91 lr = None # can't be trusted
92
92
93 try:
93 try:
94 p1, p2 = obj.parents(node)
94 p1, p2 = obj.parents(node)
95 if p1 not in seen and p1 != nullid:
95 if p1 not in seen and p1 != nullid:
96 err(lr, _("unknown parent 1 %s of %s") %
96 err(lr, _("unknown parent 1 %s of %s") %
97 (short(p1), short(n)), f)
97 (short(p1), short(n)), f)
98 if p2 not in seen and p2 != nullid:
98 if p2 not in seen and p2 != nullid:
99 err(lr, _("unknown parent 2 %s of %s") %
99 err(lr, _("unknown parent 2 %s of %s") %
100 (short(p2), short(p1)), f)
100 (short(p2), short(p1)), f)
101 except Exception, inst:
101 except Exception, inst:
102 exc(lr, _("checking parents of %s") % short(node), inst, f)
102 exc(lr, _("checking parents of %s") % short(node), inst, f)
103
103
104 if node in seen:
104 if node in seen:
105 err(lr, _("duplicate revision %d (%d)") % (i, seen[n]), f)
105 err(lr, _("duplicate revision %d (%d)") % (i, seen[n]), f)
106 seen[n] = i
106 seen[n] = i
107 return lr
107 return lr
108
108
109 if os.path.exists(repo.sjoin("journal")):
109 if os.path.exists(repo.sjoin("journal")):
110 ui.warn(_("abandoned transaction found - run hg recover\n"))
110 ui.warn(_("abandoned transaction found - run hg recover\n"))
111
111
112 revlogv1 = cl.version != revlog.REVLOGV0
112 revlogv1 = cl.version != revlog.REVLOGV0
113 if ui.verbose or not revlogv1:
113 if ui.verbose or not revlogv1:
114 ui.status(_("repository uses revlog format %d\n") %
114 ui.status(_("repository uses revlog format %d\n") %
115 (revlogv1 and 1 or 0))
115 (revlogv1 and 1 or 0))
116
116
117 havecl = len(cl) > 0
117 havecl = len(cl) > 0
118 havemf = len(mf) > 0
118 havemf = len(mf) > 0
119
119
120 ui.status(_("checking changesets\n"))
120 ui.status(_("checking changesets\n"))
121 seen = {}
121 seen = {}
122 checklog(cl, "changelog", 0)
122 checklog(cl, "changelog", 0)
123 total = len(repo)
123 for i in repo:
124 for i in repo:
125 ui.progress('changelog', i, total=total)
124 n = cl.node(i)
126 n = cl.node(i)
125 checkentry(cl, i, n, seen, [i], "changelog")
127 checkentry(cl, i, n, seen, [i], "changelog")
126
128
127 try:
129 try:
128 changes = cl.read(n)
130 changes = cl.read(n)
129 mflinkrevs.setdefault(changes[0], []).append(i)
131 mflinkrevs.setdefault(changes[0], []).append(i)
130 for f in changes[3]:
132 for f in changes[3]:
131 filelinkrevs.setdefault(f, []).append(i)
133 filelinkrevs.setdefault(f, []).append(i)
132 except Exception, inst:
134 except Exception, inst:
133 exc(i, _("unpacking changeset %s") % short(n), inst)
135 exc(i, _("unpacking changeset %s") % short(n), inst)
136 ui.progress('changelog', None)
134
137
135 ui.status(_("checking manifests\n"))
138 ui.status(_("checking manifests\n"))
136 seen = {}
139 seen = {}
137 checklog(mf, "manifest", 0)
140 checklog(mf, "manifest", 0)
141 total = len(mf)
138 for i in mf:
142 for i in mf:
143 ui.progress('manifests', i, total=total)
139 n = mf.node(i)
144 n = mf.node(i)
140 lr = checkentry(mf, i, n, seen, mflinkrevs.get(n, []), "manifest")
145 lr = checkentry(mf, i, n, seen, mflinkrevs.get(n, []), "manifest")
141 if n in mflinkrevs:
146 if n in mflinkrevs:
142 del mflinkrevs[n]
147 del mflinkrevs[n]
143 else:
148 else:
144 err(lr, _("%s not in changesets") % short(n), "manifest")
149 err(lr, _("%s not in changesets") % short(n), "manifest")
145
150
146 try:
151 try:
147 for f, fn in mf.readdelta(n).iteritems():
152 for f, fn in mf.readdelta(n).iteritems():
148 if not f:
153 if not f:
149 err(lr, _("file without name in manifest"))
154 err(lr, _("file without name in manifest"))
150 elif f != "/dev/null":
155 elif f != "/dev/null":
151 filenodes.setdefault(f, {}).setdefault(fn, lr)
156 filenodes.setdefault(f, {}).setdefault(fn, lr)
152 except Exception, inst:
157 except Exception, inst:
153 exc(lr, _("reading manifest delta %s") % short(n), inst)
158 exc(lr, _("reading manifest delta %s") % short(n), inst)
159 ui.progress('manifests', None)
154
160
155 ui.status(_("crosschecking files in changesets and manifests\n"))
161 ui.status(_("crosschecking files in changesets and manifests\n"))
156
162
163 total = len(mflinkrevs) + len(filelinkrevs) + len(filenodes)
164 count = 0
157 if havemf:
165 if havemf:
158 for c, m in sorted([(c, m) for m in mflinkrevs
166 for c, m in sorted([(c, m) for m in mflinkrevs
159 for c in mflinkrevs[m]]):
167 for c in mflinkrevs[m]]):
168 count += 1
169 ui.progress('crosscheck', count, total=total)
160 err(c, _("changeset refers to unknown manifest %s") % short(m))
170 err(c, _("changeset refers to unknown manifest %s") % short(m))
161 mflinkrevs = None # del is bad here due to scope issues
171 mflinkrevs = None # del is bad here due to scope issues
162
172
163 for f in sorted(filelinkrevs):
173 for f in sorted(filelinkrevs):
174 count += 1
175 ui.progress('crosscheck', count, total=total)
164 if f not in filenodes:
176 if f not in filenodes:
165 lr = filelinkrevs[f][0]
177 lr = filelinkrevs[f][0]
166 err(lr, _("in changeset but not in manifest"), f)
178 err(lr, _("in changeset but not in manifest"), f)
167
179
168 if havecl:
180 if havecl:
169 for f in sorted(filenodes):
181 for f in sorted(filenodes):
182 count += 1
183 ui.progress('crosscheck', count, total=total)
170 if f not in filelinkrevs:
184 if f not in filelinkrevs:
171 try:
185 try:
172 fl = repo.file(f)
186 fl = repo.file(f)
173 lr = min([fl.linkrev(fl.rev(n)) for n in filenodes[f]])
187 lr = min([fl.linkrev(fl.rev(n)) for n in filenodes[f]])
174 except:
188 except:
175 lr = None
189 lr = None
176 err(lr, _("in manifest but not in changeset"), f)
190 err(lr, _("in manifest but not in changeset"), f)
177
191
192 ui.progress('crosscheck', None)
193
178 ui.status(_("checking files\n"))
194 ui.status(_("checking files\n"))
179
195
180 storefiles = set()
196 storefiles = set()
181 for f, f2, size in repo.store.datafiles():
197 for f, f2, size in repo.store.datafiles():
182 if not f:
198 if not f:
183 err(None, _("cannot decode filename '%s'") % f2)
199 err(None, _("cannot decode filename '%s'") % f2)
184 elif size > 0:
200 elif size > 0:
185 storefiles.add(f)
201 storefiles.add(f)
186
202
187 files = sorted(set(filenodes) | set(filelinkrevs))
203 files = sorted(set(filenodes) | set(filelinkrevs))
188 for f in files:
204 total = len(files)
205 for i, f in enumerate(files):
206 ui.progress('files', i, item=f, total=total)
189 try:
207 try:
190 linkrevs = filelinkrevs[f]
208 linkrevs = filelinkrevs[f]
191 except KeyError:
209 except KeyError:
192 # in manifest but not in changelog
210 # in manifest but not in changelog
193 linkrevs = []
211 linkrevs = []
194
212
195 if linkrevs:
213 if linkrevs:
196 lr = linkrevs[0]
214 lr = linkrevs[0]
197 else:
215 else:
198 lr = None
216 lr = None
199
217
200 try:
218 try:
201 fl = repo.file(f)
219 fl = repo.file(f)
202 except error.RevlogError, e:
220 except error.RevlogError, e:
203 err(lr, _("broken revlog! (%s)") % e, f)
221 err(lr, _("broken revlog! (%s)") % e, f)
204 continue
222 continue
205
223
206 for ff in fl.files():
224 for ff in fl.files():
207 try:
225 try:
208 storefiles.remove(ff)
226 storefiles.remove(ff)
209 except KeyError:
227 except KeyError:
210 err(lr, _("missing revlog!"), ff)
228 err(lr, _("missing revlog!"), ff)
211
229
212 checklog(fl, f, lr)
230 checklog(fl, f, lr)
213 seen = {}
231 seen = {}
214 for i in fl:
232 for i in fl:
215 revisions += 1
233 revisions += 1
216 n = fl.node(i)
234 n = fl.node(i)
217 lr = checkentry(fl, i, n, seen, linkrevs, f)
235 lr = checkentry(fl, i, n, seen, linkrevs, f)
218 if f in filenodes:
236 if f in filenodes:
219 if havemf and n not in filenodes[f]:
237 if havemf and n not in filenodes[f]:
220 err(lr, _("%s not in manifests") % (short(n)), f)
238 err(lr, _("%s not in manifests") % (short(n)), f)
221 else:
239 else:
222 del filenodes[f][n]
240 del filenodes[f][n]
223
241
224 # verify contents
242 # verify contents
225 try:
243 try:
226 t = fl.read(n)
244 t = fl.read(n)
227 rp = fl.renamed(n)
245 rp = fl.renamed(n)
228 if len(t) != fl.size(i):
246 if len(t) != fl.size(i):
229 if len(fl.revision(n)) != fl.size(i):
247 if len(fl.revision(n)) != fl.size(i):
230 err(lr, _("unpacked size is %s, %s expected") %
248 err(lr, _("unpacked size is %s, %s expected") %
231 (len(t), fl.size(i)), f)
249 (len(t), fl.size(i)), f)
232 except Exception, inst:
250 except Exception, inst:
233 exc(lr, _("unpacking %s") % short(n), inst, f)
251 exc(lr, _("unpacking %s") % short(n), inst, f)
234
252
235 # check renames
253 # check renames
236 try:
254 try:
237 if rp:
255 if rp:
238 if lr is not None and ui.verbose:
256 if lr is not None and ui.verbose:
239 ctx = lrugetctx(lr)
257 ctx = lrugetctx(lr)
240 found = False
258 found = False
241 for pctx in ctx.parents():
259 for pctx in ctx.parents():
242 if rp[0] in pctx:
260 if rp[0] in pctx:
243 found = True
261 found = True
244 break
262 break
245 if not found:
263 if not found:
246 warn(_("warning: copy source of '%s' not"
264 warn(_("warning: copy source of '%s' not"
247 " in parents of %s") % (f, ctx))
265 " in parents of %s") % (f, ctx))
248 fl2 = repo.file(rp[0])
266 fl2 = repo.file(rp[0])
249 if not len(fl2):
267 if not len(fl2):
250 err(lr, _("empty or missing copy source revlog %s:%s")
268 err(lr, _("empty or missing copy source revlog %s:%s")
251 % (rp[0], short(rp[1])), f)
269 % (rp[0], short(rp[1])), f)
252 elif rp[1] == nullid:
270 elif rp[1] == nullid:
253 ui.note(_("warning: %s@%s: copy source"
271 ui.note(_("warning: %s@%s: copy source"
254 " revision is nullid %s:%s\n")
272 " revision is nullid %s:%s\n")
255 % (f, lr, rp[0], short(rp[1])))
273 % (f, lr, rp[0], short(rp[1])))
256 else:
274 else:
257 fl2.rev(rp[1])
275 fl2.rev(rp[1])
258 except Exception, inst:
276 except Exception, inst:
259 exc(lr, _("checking rename of %s") % short(n), inst, f)
277 exc(lr, _("checking rename of %s") % short(n), inst, f)
260
278
261 # cross-check
279 # cross-check
262 if f in filenodes:
280 if f in filenodes:
263 fns = [(lr, n) for n, lr in filenodes[f].iteritems()]
281 fns = [(lr, n) for n, lr in filenodes[f].iteritems()]
264 for lr, node in sorted(fns):
282 for lr, node in sorted(fns):
265 err(lr, _("%s in manifests not found") % short(node), f)
283 err(lr, _("%s in manifests not found") % short(node), f)
284 ui.progress('files', None)
266
285
267 for f in storefiles:
286 for f in storefiles:
268 warn(_("warning: orphan revlog '%s'") % f)
287 warn(_("warning: orphan revlog '%s'") % f)
269
288
270 ui.status(_("%d files, %d changesets, %d total revisions\n") %
289 ui.status(_("%d files, %d changesets, %d total revisions\n") %
271 (len(files), len(cl), revisions))
290 (len(files), len(cl), revisions))
272 if warnings[0]:
291 if warnings[0]:
273 ui.warn(_("%d warnings encountered!\n") % warnings[0])
292 ui.warn(_("%d warnings encountered!\n") % warnings[0])
274 if errors[0]:
293 if errors[0]:
275 ui.warn(_("%d integrity errors encountered!\n") % errors[0])
294 ui.warn(_("%d integrity errors encountered!\n") % errors[0])
276 if badrevs:
295 if badrevs:
277 ui.warn(_("(first damaged changeset appears to be %d)\n")
296 ui.warn(_("(first damaged changeset appears to be %d)\n")
278 % min(badrevs))
297 % min(badrevs))
279 return 1
298 return 1
General Comments 0
You need to be logged in to leave comments. Login now