verify: filter the candidate list for broken linkrevs
Matt Mackall
r9657:96c803e9 default
@@ -1,269 +1,274 b''
1 # verify.py - repository integrity checking for Mercurial
1 # verify.py - repository integrity checking for Mercurial
2 #
2 #
3 # Copyright 2006, 2007 Matt Mackall <mpm@selenic.com>
3 # Copyright 2006, 2007 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2, incorporated herein by reference.
6 # GNU General Public License version 2, incorporated herein by reference.
7
7
8 from node import nullid, short
8 from node import nullid, short
9 from i18n import _
9 from i18n import _
10 import revlog, util, error
10 import revlog, util, error
11
11
12 def verify(repo):
12 def verify(repo):
13 lock = repo.lock()
13 lock = repo.lock()
14 try:
14 try:
15 return _verify(repo)
15 return _verify(repo)
16 finally:
16 finally:
17 lock.release()
17 lock.release()
18
18
19 def _verify(repo):
19 def _verify(repo):
20 mflinkrevs = {}
20 mflinkrevs = {}
21 filelinkrevs = {}
21 filelinkrevs = {}
22 filenodes = {}
22 filenodes = {}
23 revisions = 0
23 revisions = 0
24 badrevs = set()
24 badrevs = set()
25 errors = [0]
25 errors = [0]
26 warnings = [0]
26 warnings = [0]
27 ui = repo.ui
27 ui = repo.ui
28 cl = repo.changelog
28 cl = repo.changelog
29 mf = repo.manifest
29 mf = repo.manifest
30 lrugetctx = util.lrucachefunc(repo.changectx)
30
31
31 if not repo.cancopy():
32 if not repo.cancopy():
32 raise util.Abort(_("cannot verify bundle or remote repos"))
33 raise util.Abort(_("cannot verify bundle or remote repos"))
33
34
34 def err(linkrev, msg, filename=None):
35 def err(linkrev, msg, filename=None):
35 if linkrev != None:
36 if linkrev != None:
36 badrevs.add(linkrev)
37 badrevs.add(linkrev)
37 else:
38 else:
38 linkrev = '?'
39 linkrev = '?'
39 msg = "%s: %s" % (linkrev, msg)
40 msg = "%s: %s" % (linkrev, msg)
40 if filename:
41 if filename:
41 msg = "%s@%s" % (filename, msg)
42 msg = "%s@%s" % (filename, msg)
42 ui.warn(" " + msg + "\n")
43 ui.warn(" " + msg + "\n")
43 errors[0] += 1
44 errors[0] += 1
44
45
45 def exc(linkrev, msg, inst, filename=None):
46 def exc(linkrev, msg, inst, filename=None):
46 if isinstance(inst, KeyboardInterrupt):
47 if isinstance(inst, KeyboardInterrupt):
47 ui.warn(_("interrupted"))
48 ui.warn(_("interrupted"))
48 raise
49 raise
49 err(linkrev, "%s: %s" % (msg, inst), filename)
50 err(linkrev, "%s: %s" % (msg, inst), filename)
50
51
51 def warn(msg):
52 def warn(msg):
52 ui.warn(msg + "\n")
53 ui.warn(msg + "\n")
53 warnings[0] += 1
54 warnings[0] += 1
54
55
55 def checklog(obj, name, linkrev):
56 def checklog(obj, name, linkrev):
56 if not len(obj) and (havecl or havemf):
57 if not len(obj) and (havecl or havemf):
57 err(linkrev, _("empty or missing %s") % name)
58 err(linkrev, _("empty or missing %s") % name)
58 return
59 return
59
60
60 d = obj.checksize()
61 d = obj.checksize()
61 if d[0]:
62 if d[0]:
62 err(None, _("data length off by %d bytes") % d[0], name)
63 err(None, _("data length off by %d bytes") % d[0], name)
63 if d[1]:
64 if d[1]:
64 err(None, _("index contains %d extra bytes") % d[1], name)
65 err(None, _("index contains %d extra bytes") % d[1], name)
65
66
66 if obj.version != revlog.REVLOGV0:
67 if obj.version != revlog.REVLOGV0:
67 if not revlogv1:
68 if not revlogv1:
68 warn(_("warning: `%s' uses revlog format 1") % name)
69 warn(_("warning: `%s' uses revlog format 1") % name)
69 elif revlogv1:
70 elif revlogv1:
70 warn(_("warning: `%s' uses revlog format 0") % name)
71 warn(_("warning: `%s' uses revlog format 0") % name)
71
72
72 def checkentry(obj, i, node, seen, linkrevs, f):
73 def checkentry(obj, i, node, seen, linkrevs, f):
73 lr = obj.linkrev(obj.rev(node))
74 lr = obj.linkrev(obj.rev(node))
74 if lr < 0 or (havecl and lr not in linkrevs):
75 if lr < 0 or (havecl and lr not in linkrevs):
75 if lr < 0 or lr >= len(cl):
76 if lr < 0 or lr >= len(cl):
76 msg = _("rev %d points to nonexistent changeset %d")
77 msg = _("rev %d points to nonexistent changeset %d")
77 else:
78 else:
78 msg = _("rev %d points to unexpected changeset %d")
79 msg = _("rev %d points to unexpected changeset %d")
79 err(None, msg % (i, lr), f)
80 err(None, msg % (i, lr), f)
80 if linkrevs:
81 if linkrevs:
82 if f and len(linkrevs) > 1:
83 try:
84 # attempt to filter down to real linkrevs
85 linkrevs = [l for l in linkrevs
86 if lrugetctx(l)[f].filenode() == node]
87 except:
88 pass
81 warn(_(" (expected %s)") % " ".join(map(str, linkrevs)))
89 warn(_(" (expected %s)") % " ".join(map(str, linkrevs)))
82 lr = None # can't be trusted
90 lr = None # can't be trusted
83
91
84 try:
92 try:
85 p1, p2 = obj.parents(node)
93 p1, p2 = obj.parents(node)
86 if p1 not in seen and p1 != nullid:
94 if p1 not in seen and p1 != nullid:
87 err(lr, _("unknown parent 1 %s of %s") %
95 err(lr, _("unknown parent 1 %s of %s") %
88 (short(p1), short(n)), f)
96 (short(p1), short(n)), f)
89 if p2 not in seen and p2 != nullid:
97 if p2 not in seen and p2 != nullid:
90 err(lr, _("unknown parent 2 %s of %s") %
98 err(lr, _("unknown parent 2 %s of %s") %
91 (short(p2), short(p1)), f)
99 (short(p2), short(p1)), f)
92 except Exception, inst:
100 except Exception, inst:
93 exc(lr, _("checking parents of %s") % short(node), inst, f)
101 exc(lr, _("checking parents of %s") % short(node), inst, f)
94
102
95 if node in seen:
103 if node in seen:
96 err(lr, _("duplicate revision %d (%d)") % (i, seen[n]), f)
104 err(lr, _("duplicate revision %d (%d)") % (i, seen[n]), f)
97 seen[n] = i
105 seen[n] = i
98 return lr
106 return lr
99
107
100 revlogv1 = cl.version != revlog.REVLOGV0
108 revlogv1 = cl.version != revlog.REVLOGV0
101 if ui.verbose or not revlogv1:
109 if ui.verbose or not revlogv1:
102 ui.status(_("repository uses revlog format %d\n") %
110 ui.status(_("repository uses revlog format %d\n") %
103 (revlogv1 and 1 or 0))
111 (revlogv1 and 1 or 0))
104
112
105 havecl = len(cl) > 0
113 havecl = len(cl) > 0
106 havemf = len(mf) > 0
114 havemf = len(mf) > 0
107
115
108 ui.status(_("checking changesets\n"))
116 ui.status(_("checking changesets\n"))
109 seen = {}
117 seen = {}
110 checklog(cl, "changelog", 0)
118 checklog(cl, "changelog", 0)
111 for i in repo:
119 for i in repo:
112 n = cl.node(i)
120 n = cl.node(i)
113 checkentry(cl, i, n, seen, [i], "changelog")
121 checkentry(cl, i, n, seen, [i], "changelog")
114
122
115 try:
123 try:
116 changes = cl.read(n)
124 changes = cl.read(n)
117 mflinkrevs.setdefault(changes[0], []).append(i)
125 mflinkrevs.setdefault(changes[0], []).append(i)
118 for f in changes[3]:
126 for f in changes[3]:
119 filelinkrevs.setdefault(f, []).append(i)
127 filelinkrevs.setdefault(f, []).append(i)
120 except Exception, inst:
128 except Exception, inst:
121 exc(i, _("unpacking changeset %s") % short(n), inst)
129 exc(i, _("unpacking changeset %s") % short(n), inst)
122
130
123 ui.status(_("checking manifests\n"))
131 ui.status(_("checking manifests\n"))
124 seen = {}
132 seen = {}
125 checklog(mf, "manifest", 0)
133 checklog(mf, "manifest", 0)
126 for i in mf:
134 for i in mf:
127 n = mf.node(i)
135 n = mf.node(i)
128 lr = checkentry(mf, i, n, seen, mflinkrevs.get(n, []), "manifest")
136 lr = checkentry(mf, i, n, seen, mflinkrevs.get(n, []), "manifest")
129 if n in mflinkrevs:
137 if n in mflinkrevs:
130 del mflinkrevs[n]
138 del mflinkrevs[n]
131 else:
139 else:
132 err(lr, _("%s not in changesets") % short(n), "manifest")
140 err(lr, _("%s not in changesets") % short(n), "manifest")
133
141
134 try:
142 try:
135 for f, fn in mf.readdelta(n).iteritems():
143 for f, fn in mf.readdelta(n).iteritems():
136 if not f:
144 if not f:
137 err(lr, _("file without name in manifest"))
145 err(lr, _("file without name in manifest"))
138 elif f != "/dev/null":
146 elif f != "/dev/null":
139 fns = filenodes.setdefault(f, {})
147 filenodes.setdefault(f, {}).setdefault(fn, lr)
140 if fn not in fns:
141 fns[fn] = i
142 except Exception, inst:
148 except Exception, inst:
143 exc(lr, _("reading manifest delta %s") % short(n), inst)
149 exc(lr, _("reading manifest delta %s") % short(n), inst)
144
150
145 ui.status(_("crosschecking files in changesets and manifests\n"))
151 ui.status(_("crosschecking files in changesets and manifests\n"))
146
152
147 if havemf:
153 if havemf:
148 for c,m in sorted([(c, m) for m in mflinkrevs for c in mflinkrevs[m]]):
154 for c,m in sorted([(c, m) for m in mflinkrevs for c in mflinkrevs[m]]):
149 err(c, _("changeset refers to unknown manifest %s") % short(m))
155 err(c, _("changeset refers to unknown manifest %s") % short(m))
150 mflinkrevs = None # del is bad here due to scope issues
156 mflinkrevs = None # del is bad here due to scope issues
151
157
152 for f in sorted(filelinkrevs):
158 for f in sorted(filelinkrevs):
153 if f not in filenodes:
159 if f not in filenodes:
154 lr = filelinkrevs[f][0]
160 lr = filelinkrevs[f][0]
155 err(lr, _("in changeset but not in manifest"), f)
161 err(lr, _("in changeset but not in manifest"), f)
156
162
157 if havecl:
163 if havecl:
158 for f in sorted(filenodes):
164 for f in sorted(filenodes):
159 if f not in filelinkrevs:
165 if f not in filelinkrevs:
160 try:
166 try:
161 fl = repo.file(f)
167 fl = repo.file(f)
162 lr = min([fl.linkrev(fl.rev(n)) for n in filenodes[f]])
168 lr = min([fl.linkrev(fl.rev(n)) for n in filenodes[f]])
163 except:
169 except:
164 lr = None
170 lr = None
165 err(lr, _("in manifest but not in changeset"), f)
171 err(lr, _("in manifest but not in changeset"), f)
166
172
167 ui.status(_("checking files\n"))
173 ui.status(_("checking files\n"))
168
174
169 storefiles = set()
175 storefiles = set()
170 for f, f2, size in repo.store.datafiles():
176 for f, f2, size in repo.store.datafiles():
171 if not f:
177 if not f:
172 err(None, _("cannot decode filename '%s'") % f2)
178 err(None, _("cannot decode filename '%s'") % f2)
173 elif size > 0:
179 elif size > 0:
174 storefiles.add(f)
180 storefiles.add(f)
175
181
176 lrugetctx = util.lrucachefunc(repo.changectx)
177 files = sorted(set(filenodes) | set(filelinkrevs))
182 files = sorted(set(filenodes) | set(filelinkrevs))
178 for f in files:
183 for f in files:
179 try:
184 try:
180 linkrevs = filelinkrevs[f]
185 linkrevs = filelinkrevs[f]
181 except KeyError:
186 except KeyError:
182 # in manifest but not in changelog
187 # in manifest but not in changelog
183 linkrevs = []
188 linkrevs = []
184
189
185 if linkrevs:
190 if linkrevs:
186 lr = linkrevs[0]
191 lr = linkrevs[0]
187 else:
192 else:
188 lr = None
193 lr = None
189
194
190 try:
195 try:
191 fl = repo.file(f)
196 fl = repo.file(f)
192 except error.RevlogError, e:
197 except error.RevlogError, e:
193 err(lr, _("broken revlog! (%s)") % e, f)
198 err(lr, _("broken revlog! (%s)") % e, f)
194 continue
199 continue
195
200
196 for ff in fl.files():
201 for ff in fl.files():
197 try:
202 try:
198 storefiles.remove(ff)
203 storefiles.remove(ff)
199 except KeyError:
204 except KeyError:
200 err(lr, _("missing revlog!"), ff)
205 err(lr, _("missing revlog!"), ff)
201
206
202 checklog(fl, f, lr)
207 checklog(fl, f, lr)
203 seen = {}
208 seen = {}
204 for i in fl:
209 for i in fl:
205 revisions += 1
210 revisions += 1
206 n = fl.node(i)
211 n = fl.node(i)
207 lr = checkentry(fl, i, n, seen, linkrevs, f)
212 lr = checkentry(fl, i, n, seen, linkrevs, f)
208 if f in filenodes:
213 if f in filenodes:
209 if havemf and n not in filenodes[f]:
214 if havemf and n not in filenodes[f]:
210 err(lr, _("%s not in manifests") % (short(n)), f)
215 err(lr, _("%s not in manifests") % (short(n)), f)
211 else:
216 else:
212 del filenodes[f][n]
217 del filenodes[f][n]
213
218
214 # verify contents
219 # verify contents
215 try:
220 try:
216 t = fl.read(n)
221 t = fl.read(n)
217 rp = fl.renamed(n)
222 rp = fl.renamed(n)
218 if len(t) != fl.size(i):
223 if len(t) != fl.size(i):
219 if len(fl.revision(n)) != fl.size(i):
224 if len(fl.revision(n)) != fl.size(i):
220 err(lr, _("unpacked size is %s, %s expected") %
225 err(lr, _("unpacked size is %s, %s expected") %
221 (len(t), fl.size(i)), f)
226 (len(t), fl.size(i)), f)
222 except Exception, inst:
227 except Exception, inst:
223 exc(lr, _("unpacking %s") % short(n), inst, f)
228 exc(lr, _("unpacking %s") % short(n), inst, f)
224
229
225 # check renames
230 # check renames
226 try:
231 try:
227 if rp:
232 if rp:
228 if lr is not None and ui.verbose:
233 if lr is not None and ui.verbose:
229 ctx = lrugetctx(lr)
234 ctx = lrugetctx(lr)
230 found = False
235 found = False
231 for pctx in ctx.parents():
236 for pctx in ctx.parents():
232 if rp[0] in pctx:
237 if rp[0] in pctx:
233 found = True
238 found = True
234 break
239 break
235 if not found:
240 if not found:
236 warn(_("warning: copy source of '%s' not"
241 warn(_("warning: copy source of '%s' not"
237 " in parents of %s") % (f, ctx))
242 " in parents of %s") % (f, ctx))
238 fl2 = repo.file(rp[0])
243 fl2 = repo.file(rp[0])
239 if not len(fl2):
244 if not len(fl2):
240 err(lr, _("empty or missing copy source revlog %s:%s")
245 err(lr, _("empty or missing copy source revlog %s:%s")
241 % (rp[0], short(rp[1])), f)
246 % (rp[0], short(rp[1])), f)
242 elif rp[1] == nullid:
247 elif rp[1] == nullid:
243 ui.note(_("warning: %s@%s: copy source"
248 ui.note(_("warning: %s@%s: copy source"
244 " revision is nullid %s:%s\n")
249 " revision is nullid %s:%s\n")
245 % (f, lr, rp[0], short(rp[1])))
250 % (f, lr, rp[0], short(rp[1])))
246 else:
251 else:
247 fl2.rev(rp[1])
252 fl2.rev(rp[1])
248 except Exception, inst:
253 except Exception, inst:
249 exc(lr, _("checking rename of %s") % short(n), inst, f)
254 exc(lr, _("checking rename of %s") % short(n), inst, f)
250
255
251 # cross-check
256 # cross-check
252 if f in filenodes:
257 if f in filenodes:
253 fns = [(mf.linkrev(l), n) for n,l in filenodes[f].iteritems()]
258 fns = [(lr, n) for n,lr in filenodes[f].iteritems()]
254 for lr, node in sorted(fns):
259 for lr, node in sorted(fns):
255 err(lr, _("%s in manifests not found") % short(node), f)
260 err(lr, _("%s in manifests not found") % short(node), f)
256
261
257 for f in storefiles:
262 for f in storefiles:
258 warn(_("warning: orphan revlog '%s'") % f)
263 warn(_("warning: orphan revlog '%s'") % f)
259
264
260 ui.status(_("%d files, %d changesets, %d total revisions\n") %
265 ui.status(_("%d files, %d changesets, %d total revisions\n") %
261 (len(files), len(cl), revisions))
266 (len(files), len(cl), revisions))
262 if warnings[0]:
267 if warnings[0]:
263 ui.warn(_("%d warnings encountered!\n") % warnings[0])
268 ui.warn(_("%d warnings encountered!\n") % warnings[0])
264 if errors[0]:
269 if errors[0]:
265 ui.warn(_("%d integrity errors encountered!\n") % errors[0])
270 ui.warn(_("%d integrity errors encountered!\n") % errors[0])
266 if badrevs:
271 if badrevs:
267 ui.warn(_("(first damaged changeset appears to be %d)\n")
272 ui.warn(_("(first damaged changeset appears to be %d)\n")
268 % min(badrevs))
273 % min(badrevs))
269 return 1
274 return 1
General Comments 0
You need to be logged in to leave comments. Login now