##// END OF EJS Templates
store: document the decoding discrepancy in store.py...
marmoute -
r48589:59bc92a7 stable
parent child Browse files
Show More
@@ -1,834 +1,839 b''
1 # store.py - repository store handling for Mercurial
1 # store.py - repository store handling for Mercurial
2 #
2 #
3 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
3 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import errno
10 import errno
11 import functools
11 import functools
12 import os
12 import os
13 import re
13 import re
14 import stat
14 import stat
15
15
16 from .i18n import _
16 from .i18n import _
17 from .pycompat import getattr
17 from .pycompat import getattr
18 from .node import hex
18 from .node import hex
19 from . import (
19 from . import (
20 changelog,
20 changelog,
21 error,
21 error,
22 manifest,
22 manifest,
23 policy,
23 policy,
24 pycompat,
24 pycompat,
25 util,
25 util,
26 vfs as vfsmod,
26 vfs as vfsmod,
27 )
27 )
28 from .utils import hashutil
28 from .utils import hashutil
29
29
# optional C implementations of the encoding helpers (pure-Python
# fallbacks below are used when the extension is unavailable)
parsers = policy.importmod('parsers')
# how much bytes should be read from fncache in one read
# It is done to prevent loading large fncache files into memory
fncache_chunksize = 10 ** 6
34
34
35
35
def _matchtrackedpath(path, matcher):
    """Parse a fncache entry and report whether it tracks a path accepted
    by ``matcher``.

    If matcher is None, returns True.
    """
    if matcher is None:
        return True
    decoded = decodedir(path)
    data_prefix = b'data/'
    meta_prefix = b'meta/'
    if decoded.startswith(data_prefix):
        # filelog entry: strip the "data/" prefix and the trailing ".i"
        return matcher(decoded[len(data_prefix) : -len(b'.i')])
    if decoded.startswith(meta_prefix):
        # tree-manifest entry: the tracked directory sits between
        # "meta/" and "/00manifest.i"
        subdir = decoded[len(meta_prefix) : -len(b'/00manifest.i')]
        return matcher.visitdir(subdir)
    raise error.ProgrammingError(b"cannot decode path %s" % decoded)
51
51
52
52
53 # This avoids a collision between a file named foo and a dir named
53 # This avoids a collision between a file named foo and a dir named
54 # foo.i or foo.d
54 # foo.i or foo.d
55 def _encodedir(path):
55 def _encodedir(path):
56 """
56 """
57 >>> _encodedir(b'data/foo.i')
57 >>> _encodedir(b'data/foo.i')
58 'data/foo.i'
58 'data/foo.i'
59 >>> _encodedir(b'data/foo.i/bla.i')
59 >>> _encodedir(b'data/foo.i/bla.i')
60 'data/foo.i.hg/bla.i'
60 'data/foo.i.hg/bla.i'
61 >>> _encodedir(b'data/foo.i.hg/bla.i')
61 >>> _encodedir(b'data/foo.i.hg/bla.i')
62 'data/foo.i.hg.hg/bla.i'
62 'data/foo.i.hg.hg/bla.i'
63 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
63 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
64 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
64 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
65 """
65 """
66 return (
66 return (
67 path.replace(b".hg/", b".hg.hg/")
67 path.replace(b".hg/", b".hg.hg/")
68 .replace(b".i/", b".i.hg/")
68 .replace(b".i/", b".i.hg/")
69 .replace(b".d/", b".d.hg/")
69 .replace(b".d/", b".d.hg/")
70 )
70 )
71
71
72
72
# prefer the C implementation from the parsers extension when present
encodedir = getattr(parsers, 'encodedir', _encodedir)
74
74
75
75
def decodedir(path):
    """Reverse ``_encodedir``: strip one ``.hg`` suffix from every
    ``.d.hg/``, ``.i.hg/`` and ``.hg.hg/`` directory separator.

    >>> decodedir(b'data/foo.i')
    'data/foo.i'
    >>> decodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i/bla.i'
    >>> decodedir(b'data/foo.i.hg.hg/bla.i')
    'data/foo.i.hg/bla.i'
    """
    # fast path: nothing to undo when no ".hg/" component exists
    if b".hg/" not in path:
        return path
    # undo in the mirror order of _encodedir
    for encoded, plain in (
        (b".d.hg/", b".d/"),
        (b".i.hg/", b".i/"),
        (b".hg.hg/", b".hg/"),
    ):
        path = path.replace(encoded, plain)
    return path
92
92
93
93
94 def _reserved():
94 def _reserved():
95 """characters that are problematic for filesystems
95 """characters that are problematic for filesystems
96
96
97 * ascii escapes (0..31)
97 * ascii escapes (0..31)
98 * ascii hi (126..255)
98 * ascii hi (126..255)
99 * windows specials
99 * windows specials
100
100
101 these characters will be escaped by encodefunctions
101 these characters will be escaped by encodefunctions
102 """
102 """
103 winreserved = [ord(x) for x in u'\\:*?"<>|']
103 winreserved = [ord(x) for x in u'\\:*?"<>|']
104 for x in range(32):
104 for x in range(32):
105 yield x
105 yield x
106 for x in range(126, 256):
106 for x in range(126, 256):
107 yield x
107 yield x
108 for x in winreserved:
108 for x in winreserved:
109 yield x
109 yield x
110
110
111
111
def _buildencodefun():
    """Build the reversible (encode, decode) function pair for store paths.

    Uppercase letters become ``_`` + lowercase, ``_`` becomes ``__`` and
    reserved bytes become ``~XX`` hex escapes.

    >>> enc, dec = _buildencodefun()

    >>> enc(b'nothing/special.txt')
    'nothing/special.txt'
    >>> dec(b'nothing/special.txt')
    'nothing/special.txt'

    >>> enc(b'HELLO')
    '_h_e_l_l_o'
    >>> dec(b'_h_e_l_l_o')
    'HELLO'

    >>> enc(b'hello:world?')
    'hello~3aworld~3f'
    >>> dec(b'hello~3aworld~3f')
    'hello:world?'

    >>> enc(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    >>> dec(b'the~07quick~adshot')
    'the\\x07quick\\xadshot'
    """
    e = b'_'  # the escape byte for uppercase letters (and itself)
    xchr = pycompat.bytechr
    asciistr = list(map(xchr, range(127)))
    capitals = list(range(ord(b"A"), ord(b"Z") + 1))

    # cmap: single input byte -> encoded byte string
    cmap = {x: x for x in asciistr}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in capitals + [ord(e)]:
        cmap[xchr(x)] = e + xchr(x).lower()

    # dmap: encoded token -> original byte (inverse of cmap)
    dmap = {}
    for k, v in pycompat.iteritems(cmap):
        dmap[v] = k

    def decode(s):
        # greedily try token lengths 1, 2 ("_x") and 3 ("~xx") at each
        # position; a position matching none of them is a corrupt name
        i = 0
        while i < len(s):
            for l in pycompat.xrange(1, 4):
                try:
                    yield dmap[s[i : i + l]]
                    i += l
                    break
                except KeyError:
                    pass
            else:
                raise KeyError

    return (
        lambda s: b''.join(
            [cmap[s[c : c + 1]] for c in pycompat.xrange(len(s))]
        ),
        lambda s: b''.join(list(decode(s))),
    )
170
170
171
171
# module-level encode/decode pair, built once at import time
_encodefname, _decodefname = _buildencodefun()
173
173
174
174
def encodefilename(s):
    """Apply the full reversible store encoding to ``s``.

    >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
    'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
    """
    # directory-collision encoding first, then character-level encoding
    dirsafe = encodedir(s)
    return _encodefname(dirsafe)
181
181
182
182
def decodefilename(s):
    """Invert ``encodefilename``.

    >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
    'foo.i/bar.d/bla.hg/hi:world?/HELLO'
    """
    # undo character-level encoding first, then the directory encoding
    plain = _decodefname(s)
    return decodedir(plain)
189
189
190
190
def _buildlowerencodefun():
    """Build the non-reversible lowercasing encoder.

    >>> f = _buildlowerencodefun()
    >>> f(b'nothing/special.txt')
    'nothing/special.txt'
    >>> f(b'HELLO')
    'hello'
    >>> f(b'hello:world?')
    'hello~3aworld~3f'
    >>> f(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    """
    tobyte = pycompat.bytechr
    # identity mapping for plain ASCII as the starting point
    table = {tobyte(code): tobyte(code) for code in pycompat.xrange(127)}
    # escape everything filesystems may choke on (also covers bytes >= 126)
    for code in _reserved():
        table[tobyte(code)] = b"~%02x" % code
    # fold uppercase to lowercase -- this step makes the encoding lossy
    for code in range(ord(b"A"), ord(b"Z") + 1):
        table[tobyte(code)] = tobyte(code).lower()

    def lowerencode(s):
        return b"".join([table[c] for c in pycompat.iterbytestr(s)])

    return lowerencode
214
214
215
215
# prefer the C implementation when the parsers extension provides one
lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()

# Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
_winres3 = (b'aux', b'con', b'prn', b'nul')  # length 3
_winres4 = (b'com', b'lpt')  # length 4 (with trailing 1..9)
221
221
222
222
def _auxencode(path, dotencode):
    """
    Encodes filenames containing names reserved by Windows or which end in
    period or space. Does not touch other single reserved characters c.
    Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
    Additionally encodes space or period at the beginning, if dotencode is
    True. Parameter path is assumed to be all lowercase.
    A segment only needs encoding if a reserved name appears as a
    basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
    doesn't need encoding.

    >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
    >>> _auxencode(s.split(b'/'), True)
    ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
    >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
    >>> _auxencode(s.split(b'/'), False)
    ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
    >>> _auxencode([b'foo. '], True)
    ['foo.~20']
    >>> _auxencode([b' .foo'], True)
    ['~20.foo']
    """
    # note: ``path`` (a list of segments) is modified in place and returned
    for i, n in enumerate(path):
        if not n:
            continue
        if dotencode and n[0] in b'. ':
            # escape a leading period or space
            n = b"~%02x" % ord(n[0:1]) + n[1:]
            path[i] = n
        else:
            # a reserved name only matters as the part before the first dot
            # ("aux.foo" is reserved, "foo.aux" is not)
            l = n.find(b'.')
            if l == -1:
                l = len(n)
            if (l == 3 and n[:3] in _winres3) or (
                l == 4
                and n[3:4] <= b'9'
                and n[3:4] >= b'1'
                and n[:3] in _winres4
            ):
                # encode third letter ('aux' -> 'au~78')
                ec = b"~%02x" % ord(n[2:3])
                n = n[0:2] + ec + n[3:]
                path[i] = n
        if n[-1] in b'. ':
            # encode last period or space ('foo...' -> 'foo..~2e')
            path[i] = n[:-1] + b"~%02x" % ord(n[-1:])
    return path
269
269
270
270
# longest encoded store path before we fall back to the hashed encoding
_maxstorepathlen = 120
# number of leading characters kept from each directory level when hashing
_dirprefixlen = 8
# total length budget for the shortened directory part of a hashed path
_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
274
274
275
275
def _hashencode(path, dotencode):
    """Return the hashed (non-reversible) encoding of ``path``.

    Layout: ``dh/`` + shortened directory prefixes + as much of the encoded
    basename as fits + sha1 hex digest of the full path + the original
    extension.  Used when the plain encoding would exceed
    ``_maxstorepathlen``.
    """
    digest = hex(hashutil.sha1(path).digest())
    le = lowerencode(path[5:]).split(b'/')  # skips prefix 'data/' or 'meta/'
    parts = _auxencode(le, dotencode)
    basename = parts[-1]
    _root, ext = os.path.splitext(basename)
    sdirs = []
    sdirslen = 0
    # keep up to _dirprefixlen chars of each directory level, stopping once
    # the joined result would exceed _maxshortdirslen
    for p in parts[:-1]:
        d = p[:_dirprefixlen]
        if d[-1] in b'. ':
            # Windows can't access dirs ending in period or space
            d = d[:-1] + b'_'
        if sdirslen == 0:
            t = len(d)
        else:
            t = sdirslen + 1 + len(d)  # +1 for the joining '/'
        if t > _maxshortdirslen:
            break
        sdirs.append(d)
        sdirslen = t
    dirs = b'/'.join(sdirs)
    if len(dirs) > 0:
        dirs += b'/'
    res = b'dh/' + dirs + digest + ext
    # fill remaining space with the beginning of the basename
    spaceleft = _maxstorepathlen - len(res)
    if spaceleft > 0:
        filler = basename[:spaceleft]
        res = b'dh/' + dirs + filler + digest + ext
    return res
306
306
307
307
def _hybridencode(path, dotencode):
    """encodes path with a length limit

    Encodes all paths that begin with 'data/', according to the following.

    Default encoding (reversible):

    Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
    characters are encoded as '~xx', where xx is the two digit hex code
    of the character (see encodefilename).
    Relevant path components consisting of Windows reserved filenames are
    masked by encoding the third character ('aux' -> 'au~78', see _auxencode).

    Hashed encoding (not reversible):

    If the default-encoded path is longer than _maxstorepathlen, a
    non-reversible hybrid hashing of the path is done instead.
    This encoding uses up to _dirprefixlen characters of all directory
    levels of the lowerencoded path, but not more levels than can fit into
    _maxshortdirslen.
    Then follows the filler followed by the sha digest of the full path.
    The filler is the beginning of the basename of the lowerencoded path
    (the basename is everything after the last path separator). The filler
    is as long as possible, filling in characters from the basename until
    the encoded path has _maxstorepathlen characters (or all chars of the
    basename have been taken).
    The extension (e.g. '.i' or '.d') is preserved.

    The string 'data/' at the beginning is replaced with 'dh/', if the hashed
    encoding was used.
    """
    path = encodedir(path)
    segments = _auxencode(_encodefname(path).split(b'/'), dotencode)
    encoded = b'/'.join(segments)
    if len(encoded) <= _maxstorepathlen:
        return encoded
    # too long for the plain reversible encoding: hash instead
    return _hashencode(path, dotencode)
345
345
346
346
def _pathencode(path):
    """Encode ``path`` for the dotencode layout (``_hybridencode`` with
    dotencode forced on), hashing when either the raw path or the encoded
    result exceeds ``_maxstorepathlen``."""
    direncoded = encodedir(path)
    # an over-long raw path can only get longer once encoded: hash directly
    if len(path) > _maxstorepathlen:
        return _hashencode(direncoded, True)
    segments = _auxencode(_encodefname(direncoded).split(b'/'), True)
    candidate = b'/'.join(segments)
    if len(candidate) > _maxstorepathlen:
        return _hashencode(direncoded, True)
    return candidate
356
356
357
357
# use the C fast path for the common dotencode case when available
_pathencode = getattr(parsers, 'pathencode', _pathencode)
359
359
360
360
def _plainhybridencode(f):
    # hybrid encoding with the leading-dot/space encoding disabled
    return _hybridencode(f, False)
363
363
364
364
def _calcmode(vfs):
    """Return the permission mode new files in .hg/ should be created
    with, or None when the umask already produces that mode (avoiding
    useless chmods) or when the stat fails."""
    try:
        st_mode = vfs.stat().st_mode
    except OSError:
        return None
    # if the default umask already yields this mode, chmod would be a no-op
    if (0o777 & ~util.umask) == (0o777 & st_mode):
        return None
    return st_mode
375
375
376
376
# store files and directories reported by copylist() for store copies
_data = [
    b'bookmarks',
    b'narrowspec',
    b'data',
    b'meta',
    b'00manifest.d',
    b'00manifest.i',
    b'00changelog.d',
    b'00changelog.i',
    b'phaseroots',
    b'obsstore',
    b'requires',
]
390
390
# extensions marking the main entry file of a revlog
REVLOG_FILES_MAIN_EXT = (b'.i', b'i.tmpcensored')
# extensions marking secondary revlog files
REVLOG_FILES_OTHER_EXT = (
    b'.idx',
    b'.d',
    b'.dat',
    b'.n',
    b'.nd',
    b'.sda',
    b'd.tmpcensored',
)
# files that are "volatile" and might change between listing and streaming
#
# note: the ".nd" file are nodemap data and won't "change" but they might be
# deleted.
REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')

# some exception to the above matching
#
# XXX This is currently not in use because of issue6542
# (raw bytes literal: a plain b'...' would make '\.' an invalid escape
# sequence, which raises DeprecationWarning and is a future SyntaxError)
EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')
411
411
412
412
def is_revlog(f, kind, st):
    """Classify directory entry ``f``: return its revlog type flags, or
    None when it is not a regular file or not a revlog name."""
    # only regular files can be revlogs; ``st`` is unused here
    return revlog_type(f) if kind == stat.S_IFREG else None
417
417
418
418
def revlog_type(f):
    """Map filename ``f`` to its revlog file-type flags, or None when the
    name does not look like a revlog file.

    XXX we need to filter `undo.` created by the transaction here, however
    being naive about it also filter revlog for `undo.*` files, leading to
    issue6542. So we no longer use EXCLUDED.
    """
    if f.endswith(REVLOG_FILES_MAIN_EXT):
        return FILEFLAGS_REVLOG_MAIN
    if not f.endswith(REVLOG_FILES_OTHER_EXT):
        return None
    # NOTE(review): this branch returns FILETYPE_FILELOG_OTHER (which
    # already carries FILEFLAGS_FILELOG) rather than the bare
    # FILEFLAGS_REVLOG_OTHER flag -- confirm that is intended.
    flags = FILETYPE_FILELOG_OTHER
    if f.endswith(REVLOG_FILES_VOLATILE_EXT):
        flags |= FILEFLAGS_VOLATILE
    return flags
431
431
432
432
# --- file classification bit flags used by the store walkers ---

# the file is part of changelog data
FILEFLAGS_CHANGELOG = 1 << 13
# the file is part of manifest data
FILEFLAGS_MANIFESTLOG = 1 << 12
# the file is part of filelog data
FILEFLAGS_FILELOG = 1 << 11
# file that are not directly part of a revlog
FILEFLAGS_OTHER = 1 << 10

# the main entry point for a revlog
FILEFLAGS_REVLOG_MAIN = 1 << 1
# a secondary file for a revlog
FILEFLAGS_REVLOG_OTHER = 1 << 0

# files that are "volatile" and might change between listing and streaming
FILEFLAGS_VOLATILE = 1 << 20

# convenient combinations of the flags above
FILETYPE_CHANGELOG_MAIN = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_CHANGELOG_OTHER = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_MANIFESTLOG_MAIN = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_MANIFESTLOG_OTHER = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_FILELOG_MAIN = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_FILELOG_OTHER = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_OTHER = FILEFLAGS_OTHER
457
457
458
458
class basicstore(object):
    '''base class for local repository stores'''

    def __init__(self, path, vfstype):
        vfs = vfstype(path)
        self.path = vfs.base
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        # rawvfs accesses files on disk as-is; self.vfs transparently
        # applies the directory-collision encoding to every path
        self.rawvfs = vfs
        self.vfs = vfsmod.filtervfs(vfs, encodedir)
        self.opener = self.vfs

    def join(self, f):
        '''Return the on-disk path for store file ``f``.'''
        return self.path + b'/' + encodedir(f)

    def _walk(self, relpath, recurse):
        '''Return a sorted list of (file_type, unencoded, encoded, size)
        for every revlog file under ``relpath`` (recursing into
        subdirectories when ``recurse`` is True).'''
        path = self.path
        if relpath:
            path += b'/' + relpath
        striplen = len(self.path) + 1
        l = []
        if self.rawvfs.isdir(path):
            visit = [path]
            readdir = self.rawvfs.readdir
            while visit:
                p = visit.pop()
                for f, kind, st in readdir(p, stat=True):
                    fp = p + b'/' + f
                    rl_type = is_revlog(f, kind, st)
                    if rl_type is not None:
                        # store paths relative to the store root
                        n = util.pconvert(fp[striplen:])
                        l.append((rl_type, decodedir(n), n, st.st_size))
                    elif kind == stat.S_IFDIR and recurse:
                        visit.append(fp)
        l.sort()
        return l

    def changelog(self, trypending, concurrencychecker=None):
        '''Instantiate the changelog for this store.'''
        return changelog.changelog(
            self.vfs,
            trypending=trypending,
            concurrencychecker=concurrencychecker,
        )

    def manifestlog(self, repo, storenarrowmatch):
        '''Instantiate the manifest log for this store.'''
        rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
        return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)

    def datafiles(self, matcher=None):
        '''Yield (file_type, unencoded, encoded, size) for data/meta files.

        NOTE(review): ``matcher`` is accepted for interface compatibility
        but is not applied here; subclasses such as encodedstore perform
        the filtering.
        '''
        files = self._walk(b'data', True) + self._walk(b'meta', True)
        for (t, u, e, s) in files:
            yield (FILEFLAGS_FILELOG | t, u, e, s)

    def topfiles(self):
        '''Yield (file_type, unencoded, encoded, size) for top-level files.'''
        # yield manifest before changelog
        files = reversed(self._walk(b'', False))
        for (t, u, e, s) in files:
            if u.startswith(b'00changelog'):
                yield (FILEFLAGS_CHANGELOG | t, u, e, s)
            elif u.startswith(b'00manifest'):
                yield (FILEFLAGS_MANIFESTLOG | t, u, e, s)
            else:
                yield (FILETYPE_OTHER | t, u, e, s)

    def walk(self, matcher=None):
        """return file related to data storage (ie: revlogs)

        yields (file_type, unencoded, encoded, size)

        if a matcher is passed, only storage files tracking paths matched
        by the matcher are yielded
        """
        # yield data files first
        for x in self.datafiles(matcher):
            yield x
        for x in self.topfiles():
            yield x

    def copylist(self):
        '''Return the list of store files/directories to copy on clone.'''
        return _data

    def write(self, tr):
        # no-op in the base class
        pass

    def invalidatecaches(self):
        # no-op in the base class
        pass

    def markremoved(self, fn):
        # no-op in the base class
        pass

    def __contains__(self, path):
        '''Checks if the store contains path'''
        path = b"/".join((b"data", path))
        # file?
        if self.vfs.exists(path + b".i"):
            return True
        # dir?
        if not path.endswith(b"/"):
            path = path + b"/"
        return self.vfs.exists(path)
560
560
561
561
class encodedstore(basicstore):
    '''store using the full reversible filename encoding ("store" layout).'''

    def __init__(self, path, vfstype):
        vfs = vfstype(path + b'/store')
        self.path = vfs.base
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        self.rawvfs = vfs
        # unlike basicstore, every filename goes through the full
        # reversible encoding, not just the directory encoding
        self.vfs = vfsmod.filtervfs(vfs, encodefilename)
        self.opener = self.vfs

    # note: topfiles would also need a decode phase. It is just that in
    # practice we do not have any file outside of `data/` that needs encoding.
    # However that might change so we should probably add a test and encoding
    # decoding for it too. see issue6548

    def datafiles(self, matcher=None):
        '''Yield data files with the unencoded name decoded back; entries
        whose name cannot be decoded yield None as the unencoded name.'''
        for t, a, b, size in super(encodedstore, self).datafiles():
            try:
                a = decodefilename(a)
            except KeyError:
                # undecodable name: keep the entry but signal with None
                a = None
            if a is not None and not _matchtrackedpath(a, matcher):
                continue
            yield t, a, b, size

    def join(self, f):
        '''Return the on-disk path for store file ``f``.'''
        return self.path + b'/' + encodefilename(f)

    def copylist(self):
        '''Return the list of files/directories to copy on clone.'''
        return [b'requires', b'00changelog.i'] + [b'store/' + f for f in _data]
587
592
588
593
class fncache(object):
    """Persistent set of store filenames, backed by the ``fncache`` file.

    The filenames used to be partially encoded on disk, hence the
    encodedir/decodedir dance when reading and writing the file.
    """

    def __init__(self, vfs):
        self.vfs = vfs
        # None means "not loaded yet"; a set once _load() has run
        self.entries = None
        self._dirty = False
        # set of new additions to fncache
        self.addls = set()

    def ensureloaded(self, warn=None):
        """read the fncache file if not already read.

        If the file on disk is corrupted, raise. If warn is provided,
        warn and keep going instead."""
        if self.entries is None:
            self._load(warn)

    def _load(self, warn=None):
        '''fill the entries from the fncache file'''
        self._dirty = False
        try:
            fp = self.vfs(b'fncache', mode=b'rb')
        except IOError:
            # skip nonexistent file
            self.entries = set()
            return

        self.entries = set()
        chunk = b''
        # read in bounded chunks so a huge fncache is never fully buffered
        for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
            chunk += c
            try:
                p = chunk.rindex(b'\n')
                self.entries.update(decodedir(chunk[: p + 1]).splitlines())
                chunk = chunk[p + 1 :]
            except ValueError:
                # substring '\n' not found, maybe the entry is bigger than the
                # chunksize, so let's keep iterating
                pass

        if chunk:
            # leftover bytes: the file did not end with a newline
            msg = _(b"fncache does not end with a newline")
            if warn:
                warn(msg + b'\n')
            else:
                raise error.Abort(
                    msg,
                    hint=_(
                        b"use 'hg debugrebuildfncache' to "
                        b"rebuild the fncache"
                    ),
                )
        self._checkentries(fp, warn)
        fp.close()

    def _checkentries(self, fp, warn):
        """make sure there is no empty string in entries"""
        if b'' in self.entries:
            # re-scan the file to report the offending line number(s)
            fp.seek(0)
            for n, line in enumerate(util.iterfile(fp)):
                if not line.rstrip(b'\n'):
                    t = _(b'invalid entry in fncache, line %d') % (n + 1)
                    if warn:
                        warn(t + b'\n')
                    else:
                        raise error.Abort(t)

    def write(self, tr):
        """Flush pending changes to disk within transaction ``tr``.

        A full rewrite happens when entries were removed (dirty); pure
        additions are appended to the existing file instead."""
        if self._dirty:
            assert self.entries is not None
            self.entries = self.entries | self.addls
            self.addls = set()
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
            if self.entries:
                fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
            fp.close()
            self._dirty = False
        if self.addls:
            # if we have just new entries, let's append them to the fncache
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
            if self.addls:
                fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
            fp.close()
            # force a reload on next access so entries and file agree
            self.entries = None
            self.addls = set()

    def add(self, fn):
        """Record ``fn`` as present in the store (no-op if already known)."""
        if self.entries is None:
            self._load()
        if fn not in self.entries:
            self.addls.add(fn)

    def remove(self, fn):
        """Forget ``fn``; silently ignore names that were never recorded."""
        if self.entries is None:
            self._load()
        if fn in self.addls:
            self.addls.remove(fn)
            return
        try:
            self.entries.remove(fn)
            self._dirty = True
        except KeyError:
            pass

    def __contains__(self, fn):
        if fn in self.addls:
            return True
        if self.entries is None:
            self._load()
        return fn in self.entries

    def __iter__(self):
        if self.entries is None:
            self._load()
        return iter(self.entries | self.addls)
707
712
708
713
class _fncachevfs(vfsmod.proxyvfs):
    """vfs proxy that records every data/meta file opened for writing."""

    def __init__(self, vfs, fnc, encode):
        vfsmod.proxyvfs.__init__(self, vfs)
        self.fncache = fnc
        self.encode = encode

    def __call__(self, path, mode=b'r', *args, **kw):
        encoded = self.encode(path)
        is_write = mode not in (b'r', b'rb')
        is_tracked = path.startswith(b'data/') or path.startswith(b'meta/')
        if is_write and is_tracked:
            # do not trigger a fncache load when adding a file that already is
            # known to exist.
            notload = self.fncache.entries is None and self.vfs.exists(encoded)
            if notload and b'r+' in mode and not self.vfs.stat(encoded).st_size:
                # when appending to an existing file, if the file has size zero,
                # it should be considered as missing. Such zero-size files are
                # the result of truncation when a transaction is aborted.
                notload = False
            if not notload:
                self.fncache.add(path)
        return self.vfs(encoded, mode, *args, **kw)

    def join(self, path):
        # an empty path must not go through the encoder
        if path:
            return self.vfs.join(self.encode(path))
        return self.vfs.join(path)

    def register_file(self, path):
        """generic hook point to lets fncache steer its stew"""
        if path.startswith(b'data/') or path.startswith(b'meta/'):
            self.fncache.add(path)
742
747
743
748
class fncachestore(basicstore):
    """Store flavour that tracks its file list in the ``fncache`` file."""

    def __init__(self, path, vfstype, dotencode):
        # 'dotencode' selects the variant that also escapes leading '.'/' '
        if dotencode:
            encode = _pathencode
        else:
            encode = _plainhybridencode
        self.encode = encode
        vfs = vfstype(path + b'/store')
        self.path = vfs.base
        self.pathsep = self.path + b'/'
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        self.rawvfs = vfs
        fnc = fncache(vfs)
        self.fncache = fnc
        # writes through self.vfs keep the fncache up to date
        self.vfs = _fncachevfs(vfs, fnc, encode)
        self.opener = self.vfs

    def join(self, f):
        return self.pathsep + self.encode(f)

    def getsize(self, path):
        return self.rawvfs.stat(path).st_size

    def datafiles(self, matcher=None):
        """yield (type, unencoded, encoded, size) for tracked revlog files."""
        for fname in sorted(self.fncache):
            if not _matchtrackedpath(fname, matcher):
                continue
            enc = self.encode(fname)
            try:
                ftype = revlog_type(fname)
                assert ftype is not None, fname
                ftype |= FILEFLAGS_FILELOG
                yield ftype, fname, enc, self.getsize(enc)
            except OSError as err:
                # entries listed in fncache may be gone from disk
                if err.errno != errno.ENOENT:
                    raise

    def copylist(self):
        d = (
            b'bookmarks',
            b'narrowspec',
            b'data',
            b'meta',
            b'dh',
            b'fncache',
            b'phaseroots',
            b'obsstore',
            b'00manifest.d',
            b'00manifest.i',
            b'00changelog.d',
            b'00changelog.i',
            b'requires',
        )
        return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d]

    def write(self, tr):
        self.fncache.write(tr)

    def invalidatecaches(self):
        # drop the loaded fncache state; it will be re-read on demand
        self.fncache.entries = None
        self.fncache.addls = set()

    def markremoved(self, fn):
        self.fncache.remove(fn)

    def _exists(self, f):
        """Tell whether encoded-path ``f`` actually exists on disk."""
        ef = self.encode(f)
        try:
            self.getsize(ef)
            return True
        except OSError as err:
            if err.errno != errno.ENOENT:
                raise
            # nonexistent entry
            return False

    def __contains__(self, path):
        '''Checks if the store contains path'''
        path = b"/".join((b"data", path))
        # check for files (exact match)
        e = path + b'.i'
        if e in self.fncache and self._exists(e):
            return True
        # now check for directories (prefix match)
        if not path.endswith(b'/'):
            path += b'/'
        return any(
            e.startswith(path) and self._exists(e) for e in self.fncache
        )
General Comments 0
You need to be logged in to leave comments. Login now