##// END OF EJS Templates
store: initialize vfs field first to use it for initialization of others...
FUJIWARA Katsunori -
r17724:bf4b72d8 default
parent child Browse files
Show More
@@ -1,499 +1,499
1 1 # store.py - repository store handling for Mercurial
2 2 #
3 3 # Copyright 2008 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7
8 8 from i18n import _
9 9 import osutil, scmutil, util, parsers
10 10 import os, stat, errno
11 11
12 12 _sha = util.sha1
13 13
14 14 # This avoids a collision between a file named foo and a dir named
15 15 # foo.i or foo.d
16 16 def _encodedir(path):
17 17 '''
18 18 >>> _encodedir('data/foo.i')
19 19 'data/foo.i'
20 20 >>> _encodedir('data/foo.i/bla.i')
21 21 'data/foo.i.hg/bla.i'
22 22 >>> _encodedir('data/foo.i.hg/bla.i')
23 23 'data/foo.i.hg.hg/bla.i'
24 24 >>> _encodedir('data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
25 25 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
26 26 '''
27 27 return (path
28 28 .replace(".hg/", ".hg.hg/")
29 29 .replace(".i/", ".i.hg/")
30 30 .replace(".d/", ".d.hg/"))
31 31
32 32 encodedir = getattr(parsers, 'encodedir', _encodedir)
33 33
34 34 def decodedir(path):
35 35 '''
36 36 >>> decodedir('data/foo.i')
37 37 'data/foo.i'
38 38 >>> decodedir('data/foo.i.hg/bla.i')
39 39 'data/foo.i/bla.i'
40 40 >>> decodedir('data/foo.i.hg.hg/bla.i')
41 41 'data/foo.i.hg/bla.i'
42 42 '''
43 43 if ".hg/" not in path:
44 44 return path
45 45 return (path
46 46 .replace(".d.hg/", ".d/")
47 47 .replace(".i.hg/", ".i/")
48 48 .replace(".hg.hg/", ".hg/"))
49 49
50 50 def _buildencodefun():
51 51 '''
52 52 >>> enc, dec = _buildencodefun()
53 53
54 54 >>> enc('nothing/special.txt')
55 55 'nothing/special.txt'
56 56 >>> dec('nothing/special.txt')
57 57 'nothing/special.txt'
58 58
59 59 >>> enc('HELLO')
60 60 '_h_e_l_l_o'
61 61 >>> dec('_h_e_l_l_o')
62 62 'HELLO'
63 63
64 64 >>> enc('hello:world?')
65 65 'hello~3aworld~3f'
66 66 >>> dec('hello~3aworld~3f')
67 67 'hello:world?'
68 68
69 69 >>> enc('the\x07quick\xADshot')
70 70 'the~07quick~adshot'
71 71 >>> dec('the~07quick~adshot')
72 72 'the\\x07quick\\xadshot'
73 73 '''
74 74 e = '_'
75 75 winreserved = [ord(x) for x in '\\:*?"<>|']
76 76 cmap = dict([(chr(x), chr(x)) for x in xrange(127)])
77 77 for x in (range(32) + range(126, 256) + winreserved):
78 78 cmap[chr(x)] = "~%02x" % x
79 79 for x in range(ord("A"), ord("Z")+1) + [ord(e)]:
80 80 cmap[chr(x)] = e + chr(x).lower()
81 81 dmap = {}
82 82 for k, v in cmap.iteritems():
83 83 dmap[v] = k
84 84 def decode(s):
85 85 i = 0
86 86 while i < len(s):
87 87 for l in xrange(1, 4):
88 88 try:
89 89 yield dmap[s[i:i + l]]
90 90 i += l
91 91 break
92 92 except KeyError:
93 93 pass
94 94 else:
95 95 raise KeyError
96 96 return (lambda s: ''.join([cmap[c] for c in s]),
97 97 lambda s: ''.join(list(decode(s))))
98 98
99 99 _encodefname, _decodefname = _buildencodefun()
100 100
101 101 def encodefilename(s):
102 102 '''
103 103 >>> encodefilename('foo.i/bar.d/bla.hg/hi:world?/HELLO')
104 104 'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
105 105 '''
106 106 return _encodefname(encodedir(s))
107 107
108 108 def decodefilename(s):
109 109 '''
110 110 >>> decodefilename('foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
111 111 'foo.i/bar.d/bla.hg/hi:world?/HELLO'
112 112 '''
113 113 return decodedir(_decodefname(s))
114 114
115 115 def _buildlowerencodefun():
116 116 '''
117 117 >>> f = _buildlowerencodefun()
118 118 >>> f('nothing/special.txt')
119 119 'nothing/special.txt'
120 120 >>> f('HELLO')
121 121 'hello'
122 122 >>> f('hello:world?')
123 123 'hello~3aworld~3f'
124 124 >>> f('the\x07quick\xADshot')
125 125 'the~07quick~adshot'
126 126 '''
127 127 winreserved = [ord(x) for x in '\\:*?"<>|']
128 128 cmap = dict([(chr(x), chr(x)) for x in xrange(127)])
129 129 for x in (range(32) + range(126, 256) + winreserved):
130 130 cmap[chr(x)] = "~%02x" % x
131 131 for x in range(ord("A"), ord("Z")+1):
132 132 cmap[chr(x)] = chr(x).lower()
133 133 return lambda s: "".join([cmap[c] for c in s])
134 134
135 135 lowerencode = _buildlowerencodefun()
136 136
137 137 # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
138 138 _winres3 = ('aux', 'con', 'prn', 'nul') # length 3
139 139 _winres4 = ('com', 'lpt') # length 4 (with trailing 1..9)
140 140 def _auxencode(path, dotencode):
141 141 '''
142 142 Encodes filenames containing names reserved by Windows or which end in
143 143 period or space. Does not touch other single reserved characters c.
144 144 Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
145 145 Additionally encodes space or period at the beginning, if dotencode is
146 146 True. Parameter path is assumed to be all lowercase.
147 147 A segment only needs encoding if a reserved name appears as a
148 148 basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
149 149 doesn't need encoding.
150 150
151 151 >>> s = '.foo/aux.txt/txt.aux/con/prn/nul/foo.'
152 152 >>> _auxencode(s.split('/'), True)
153 153 ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
154 154 >>> s = '.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
155 155 >>> _auxencode(s.split('/'), False)
156 156 ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
157 157 >>> _auxencode(['foo. '], True)
158 158 ['foo.~20']
159 159 >>> _auxencode([' .foo'], True)
160 160 ['~20.foo']
161 161 '''
162 162 for i, n in enumerate(path):
163 163 if not n:
164 164 continue
165 165 if dotencode and n[0] in '. ':
166 166 n = "~%02x" % ord(n[0]) + n[1:]
167 167 path[i] = n
168 168 else:
169 169 l = n.find('.')
170 170 if l == -1:
171 171 l = len(n)
172 172 if ((l == 3 and n[:3] in _winres3) or
173 173 (l == 4 and n[3] <= '9' and n[3] >= '1'
174 174 and n[:3] in _winres4)):
175 175 # encode third letter ('aux' -> 'au~78')
176 176 ec = "~%02x" % ord(n[2])
177 177 n = n[0:2] + ec + n[3:]
178 178 path[i] = n
179 179 if n[-1] in '. ':
180 180 # encode last period or space ('foo...' -> 'foo..~2e')
181 181 path[i] = n[:-1] + "~%02x" % ord(n[-1])
182 182 return path
183 183
184 184 _maxstorepathlen = 120
185 185 _dirprefixlen = 8
186 186 _maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
187 187
188 188 def _hashencode(path, dotencode):
189 189 digest = _sha(path).hexdigest()
190 190 le = lowerencode(path).split('/')[1:]
191 191 parts = _auxencode(le, dotencode)
192 192 basename = parts[-1]
193 193 _root, ext = os.path.splitext(basename)
194 194 sdirs = []
195 195 sdirslen = 0
196 196 for p in parts[:-1]:
197 197 d = p[:_dirprefixlen]
198 198 if d[-1] in '. ':
199 199 # Windows can't access dirs ending in period or space
200 200 d = d[:-1] + '_'
201 201 if sdirslen == 0:
202 202 t = len(d)
203 203 else:
204 204 t = sdirslen + 1 + len(d)
205 205 if t > _maxshortdirslen:
206 206 break
207 207 sdirs.append(d)
208 208 sdirslen = t
209 209 dirs = '/'.join(sdirs)
210 210 if len(dirs) > 0:
211 211 dirs += '/'
212 212 res = 'dh/' + dirs + digest + ext
213 213 spaceleft = _maxstorepathlen - len(res)
214 214 if spaceleft > 0:
215 215 filler = basename[:spaceleft]
216 216 res = 'dh/' + dirs + filler + digest + ext
217 217 return res
218 218
219 219 def _hybridencode(path, dotencode):
220 220 '''encodes path with a length limit
221 221
222 222 Encodes all paths that begin with 'data/', according to the following.
223 223
224 224 Default encoding (reversible):
225 225
226 226 Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
227 227 characters are encoded as '~xx', where xx is the two digit hex code
228 228 of the character (see encodefilename).
229 229 Relevant path components consisting of Windows reserved filenames are
230 230 masked by encoding the third character ('aux' -> 'au~78', see auxencode).
231 231
232 232 Hashed encoding (not reversible):
233 233
234 234 If the default-encoded path is longer than _maxstorepathlen, a
235 235 non-reversible hybrid hashing of the path is done instead.
236 236 This encoding uses up to _dirprefixlen characters of all directory
237 237 levels of the lowerencoded path, but not more levels than can fit into
238 238 _maxshortdirslen.
239 239 Then follows the filler followed by the sha digest of the full path.
240 240 The filler is the beginning of the basename of the lowerencoded path
241 241 (the basename is everything after the last path separator). The filler
242 242 is as long as possible, filling in characters from the basename until
243 243 the encoded path has _maxstorepathlen characters (or all chars of the
244 244 basename have been taken).
245 245 The extension (e.g. '.i' or '.d') is preserved.
246 246
247 247 The string 'data/' at the beginning is replaced with 'dh/', if the hashed
248 248 encoding was used.
249 249 '''
250 250 path = encodedir(path)
251 251 ef = _encodefname(path).split('/')
252 252 res = '/'.join(_auxencode(ef, dotencode))
253 253 if len(res) > _maxstorepathlen:
254 254 res = _hashencode(path, dotencode)
255 255 return res
256 256
257 257 def _pathencode(path):
258 258 if len(path) > _maxstorepathlen:
259 259 return None
260 260 ef = _encodefname(encodedir(path)).split('/')
261 261 res = '/'.join(_auxencode(ef, True))
262 262 if len(res) > _maxstorepathlen:
263 263 return None
264 264 return res
265 265
266 266 _pathencode = getattr(parsers, 'pathencode', _pathencode)
267 267
268 268 def _dothybridencode(f):
269 269 ef = _pathencode(f)
270 270 if ef is None:
271 271 return _hashencode(encodedir(f), True)
272 272 return ef
273 273
274 274 def _plainhybridencode(f):
275 275 return _hybridencode(f, False)
276 276
277 277 def _calcmode(path):
278 278 try:
279 279 # files in .hg/ will be created using this mode
280 280 mode = os.stat(path).st_mode
281 281 # avoid some useless chmods
282 282 if (0777 & ~util.umask) == (0777 & mode):
283 283 mode = None
284 284 except OSError:
285 285 mode = None
286 286 return mode
287 287
288 288 _data = ('data 00manifest.d 00manifest.i 00changelog.d 00changelog.i'
289 289 ' phaseroots obsstore')
290 290
291 291 class basicstore(object):
292 292 '''base class for local repository stores'''
293 293 def __init__(self, path, vfstype):
294 self.path = path
294 vfs = vfstype(path)
295 self.path = vfs.base
295 296 self.createmode = _calcmode(path)
296 vfs = vfstype(self.path)
297 297 vfs.createmode = self.createmode
298 298 self.vfs = scmutil.filtervfs(vfs, encodedir)
299 299 self.opener = self.vfs
300 300
301 301 def join(self, f):
302 302 return self.path + '/' + encodedir(f)
303 303
304 304 def _walk(self, relpath, recurse):
305 305 '''yields (unencoded, encoded, size)'''
306 306 path = self.path
307 307 if relpath:
308 308 path += '/' + relpath
309 309 striplen = len(self.path) + 1
310 310 l = []
311 311 if os.path.isdir(path):
312 312 visit = [path]
313 313 while visit:
314 314 p = visit.pop()
315 315 for f, kind, st in osutil.listdir(p, stat=True):
316 316 fp = p + '/' + f
317 317 if kind == stat.S_IFREG and f[-2:] in ('.d', '.i'):
318 318 n = util.pconvert(fp[striplen:])
319 319 l.append((decodedir(n), n, st.st_size))
320 320 elif kind == stat.S_IFDIR and recurse:
321 321 visit.append(fp)
322 322 l.sort()
323 323 return l
324 324
325 325 def datafiles(self):
326 326 return self._walk('data', True)
327 327
328 328 def walk(self):
329 329 '''yields (unencoded, encoded, size)'''
330 330 # yield data files first
331 331 for x in self.datafiles():
332 332 yield x
333 333 # yield manifest before changelog
334 334 for x in reversed(self._walk('', False)):
335 335 yield x
336 336
337 337 def copylist(self):
338 338 return ['requires'] + _data.split()
339 339
340 340 def write(self):
341 341 pass
342 342
343 343 class encodedstore(basicstore):
344 344 def __init__(self, path, vfstype):
345 self.path = path + '/store'
345 vfs = vfstype(path + '/store')
346 self.path = vfs.base
346 347 self.createmode = _calcmode(self.path)
347 vfs = vfstype(self.path)
348 348 vfs.createmode = self.createmode
349 349 self.vfs = scmutil.filtervfs(vfs, encodefilename)
350 350 self.opener = self.vfs
351 351
352 352 def datafiles(self):
353 353 for a, b, size in self._walk('data', True):
354 354 try:
355 355 a = decodefilename(a)
356 356 except KeyError:
357 357 a = None
358 358 yield a, b, size
359 359
360 360 def join(self, f):
361 361 return self.path + '/' + encodefilename(f)
362 362
363 363 def copylist(self):
364 364 return (['requires', '00changelog.i'] +
365 365 ['store/' + f for f in _data.split()])
366 366
367 367 class fncache(object):
368 368 # the filename used to be partially encoded
369 369 # hence the encodedir/decodedir dance
370 370 def __init__(self, vfs):
371 371 self.vfs = vfs
372 372 self.entries = None
373 373 self._dirty = False
374 374
375 375 def _load(self):
376 376 '''fill the entries from the fncache file'''
377 377 self._dirty = False
378 378 try:
379 379 fp = self.vfs('fncache', mode='rb')
380 380 except IOError:
381 381 # skip nonexistent file
382 382 self.entries = set()
383 383 return
384 384 self.entries = set(decodedir(fp.read()).splitlines())
385 385 if '' in self.entries:
386 386 fp.seek(0)
387 387 for n, line in enumerate(fp):
388 388 if not line.rstrip('\n'):
389 389 t = _('invalid entry in fncache, line %s') % (n + 1)
390 390 raise util.Abort(t)
391 391 fp.close()
392 392
393 393 def _write(self, files, atomictemp):
394 394 fp = self.vfs('fncache', mode='wb', atomictemp=atomictemp)
395 395 if files:
396 396 fp.write(encodedir('\n'.join(files) + '\n'))
397 397 fp.close()
398 398 self._dirty = False
399 399
400 400 def rewrite(self, files):
401 401 self._write(files, False)
402 402 self.entries = set(files)
403 403
404 404 def write(self):
405 405 if self._dirty:
406 406 self._write(self.entries, True)
407 407
408 408 def add(self, fn):
409 409 if self.entries is None:
410 410 self._load()
411 411 if fn not in self.entries:
412 412 self._dirty = True
413 413 self.entries.add(fn)
414 414
415 415 def __contains__(self, fn):
416 416 if self.entries is None:
417 417 self._load()
418 418 return fn in self.entries
419 419
420 420 def __iter__(self):
421 421 if self.entries is None:
422 422 self._load()
423 423 return iter(self.entries)
424 424
425 425 class _fncachevfs(scmutil.abstractvfs):
426 426 def __init__(self, vfs, fnc, encode):
427 427 self.vfs = vfs
428 428 self.fncache = fnc
429 429 self.encode = encode
430 430
431 431 def _getmustaudit(self):
432 432 return self.vfs.mustaudit
433 433
434 434 def _setmustaudit(self, onoff):
435 435 self.vfs.mustaudit = onoff
436 436
437 437 mustaudit = property(_getmustaudit, _setmustaudit)
438 438
439 439 def __call__(self, path, mode='r', *args, **kw):
440 440 if mode not in ('r', 'rb') and path.startswith('data/'):
441 441 self.fncache.add(path)
442 442 return self.vfs(self.encode(path), mode, *args, **kw)
443 443
444 444 class fncachestore(basicstore):
445 445 def __init__(self, path, vfstype, dotencode):
446 446 if dotencode:
447 447 encode = _dothybridencode
448 448 else:
449 449 encode = _plainhybridencode
450 450 self.encode = encode
451 self.path = path + '/store'
451 vfs = vfstype(path + '/store')
452 self.path = vfs.base
452 453 self.pathsep = self.path + '/'
453 454 self.createmode = _calcmode(self.path)
454 vfs = vfstype(self.path)
455 455 vfs.createmode = self.createmode
456 456 fnc = fncache(vfs)
457 457 self.fncache = fnc
458 458 self.vfs = _fncachevfs(vfs, fnc, encode)
459 459 self.opener = self.vfs
460 460
461 461 def join(self, f):
462 462 return self.pathsep + self.encode(f)
463 463
464 464 def getsize(self, path):
465 465 return os.stat(self.pathsep + path).st_size
466 466
467 467 def datafiles(self):
468 468 rewrite = False
469 469 existing = []
470 470 for f in sorted(self.fncache):
471 471 ef = self.encode(f)
472 472 try:
473 473 yield f, ef, self.getsize(ef)
474 474 existing.append(f)
475 475 except OSError, err:
476 476 if err.errno != errno.ENOENT:
477 477 raise
478 478 # nonexistent entry
479 479 rewrite = True
480 480 if rewrite:
481 481 # rewrite fncache to remove nonexistent entries
482 482 # (may be caused by rollback / strip)
483 483 self.fncache.rewrite(existing)
484 484
485 485 def copylist(self):
486 486 d = ('data dh fncache phaseroots obsstore'
487 487 ' 00manifest.d 00manifest.i 00changelog.d 00changelog.i')
488 488 return (['requires', '00changelog.i'] +
489 489 ['store/' + f for f in d.split()])
490 490
491 491 def write(self):
492 492 self.fncache.write()
493 493
494 494 def store(requirements, path, vfstype):
495 495 if 'store' in requirements:
496 496 if 'fncache' in requirements:
497 497 return fncachestore(path, vfstype, 'dotencode' in requirements)
498 498 return encodedstore(path, vfstype)
499 499 return basicstore(path, vfstype)
General Comments 0
You need to be logged in to leave comments. Login now