##// END OF EJS Templates
store: use the revlog type from revlog's constant instead of custom one...
marmoute -
r51573:e324329f default
parent child Browse files
Show More
@@ -1,1230 +1,1207
1 # store.py - repository store handling for Mercurial
1 # store.py - repository store handling for Mercurial
2 #
2 #
3 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
3 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 import collections
8 import collections
9 import functools
9 import functools
10 import os
10 import os
11 import re
11 import re
12 import stat
12 import stat
13 from typing import Generator, List
13 from typing import Generator, List
14
14
15 from .i18n import _
15 from .i18n import _
16 from .pycompat import getattr
16 from .pycompat import getattr
17 from .thirdparty import attr
17 from .thirdparty import attr
18 from .node import hex
18 from .node import hex
19 from .revlogutils.constants import (
19 from .revlogutils.constants import (
20 INDEX_HEADER,
20 INDEX_HEADER,
21 KIND_CHANGELOG,
22 KIND_FILELOG,
23 KIND_MANIFESTLOG,
21 )
24 )
22 from . import (
25 from . import (
23 changelog,
26 changelog,
24 error,
27 error,
25 filelog,
28 filelog,
26 manifest,
29 manifest,
27 policy,
30 policy,
28 pycompat,
31 pycompat,
29 revlog as revlogmod,
32 revlog as revlogmod,
30 util,
33 util,
31 vfs as vfsmod,
34 vfs as vfsmod,
32 )
35 )
33 from .utils import hashutil
36 from .utils import hashutil
34
37
35 parsers = policy.importmod('parsers')
38 parsers = policy.importmod('parsers')
36 # how much bytes should be read from fncache in one read
39 # how much bytes should be read from fncache in one read
37 # It is done to prevent loading large fncache files into memory
40 # It is done to prevent loading large fncache files into memory
38 fncache_chunksize = 10 ** 6
41 fncache_chunksize = 10 ** 6
39
42
40
43
41 def _match_tracked_entry(entry, matcher):
44 def _match_tracked_entry(entry, matcher):
42 """parses a fncache entry and returns whether the entry is tracking a path
45 """parses a fncache entry and returns whether the entry is tracking a path
43 matched by matcher or not.
46 matched by matcher or not.
44
47
45 If matcher is None, returns True"""
48 If matcher is None, returns True"""
46
49
47 if matcher is None:
50 if matcher is None:
48 return True
51 return True
49 if entry.is_filelog:
52 if entry.is_filelog:
50 return matcher(entry.target_id)
53 return matcher(entry.target_id)
51 elif entry.is_manifestlog:
54 elif entry.is_manifestlog:
52 return matcher.visitdir(entry.target_id.rstrip(b'/'))
55 return matcher.visitdir(entry.target_id.rstrip(b'/'))
53 raise error.ProgrammingError(b"cannot process entry %r" % entry)
56 raise error.ProgrammingError(b"cannot process entry %r" % entry)
54
57
55
58
56 # This avoids a collision between a file named foo and a dir named
59 # This avoids a collision between a file named foo and a dir named
57 # foo.i or foo.d
60 # foo.i or foo.d
58 def _encodedir(path):
61 def _encodedir(path):
59 """
62 """
60 >>> _encodedir(b'data/foo.i')
63 >>> _encodedir(b'data/foo.i')
61 'data/foo.i'
64 'data/foo.i'
62 >>> _encodedir(b'data/foo.i/bla.i')
65 >>> _encodedir(b'data/foo.i/bla.i')
63 'data/foo.i.hg/bla.i'
66 'data/foo.i.hg/bla.i'
64 >>> _encodedir(b'data/foo.i.hg/bla.i')
67 >>> _encodedir(b'data/foo.i.hg/bla.i')
65 'data/foo.i.hg.hg/bla.i'
68 'data/foo.i.hg.hg/bla.i'
66 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
69 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
67 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
70 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
68 """
71 """
69 return (
72 return (
70 path.replace(b".hg/", b".hg.hg/")
73 path.replace(b".hg/", b".hg.hg/")
71 .replace(b".i/", b".i.hg/")
74 .replace(b".i/", b".i.hg/")
72 .replace(b".d/", b".d.hg/")
75 .replace(b".d/", b".d.hg/")
73 )
76 )
74
77
75
78
76 encodedir = getattr(parsers, 'encodedir', _encodedir)
79 encodedir = getattr(parsers, 'encodedir', _encodedir)
77
80
78
81
def decodedir(path):
    """Undo the directory escaping performed by `_encodedir`.

    >>> decodedir(b'data/foo.i')
    'data/foo.i'
    >>> decodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i/bla.i'
    >>> decodedir(b'data/foo.i.hg.hg/bla.i')
    'data/foo.i.hg/bla.i'
    """
    # fast path: nothing was escaped in this path
    if b".hg/" not in path:
        return path
    # undo replacements in the reverse order of _encodedir
    for escaped, plain in (
        (b".d.hg/", b".d/"),
        (b".i.hg/", b".i/"),
        (b".hg.hg/", b".hg/"),
    ):
        path = path.replace(escaped, plain)
    return path
95
98
96
99
97 def _reserved():
100 def _reserved():
98 """characters that are problematic for filesystems
101 """characters that are problematic for filesystems
99
102
100 * ascii escapes (0..31)
103 * ascii escapes (0..31)
101 * ascii hi (126..255)
104 * ascii hi (126..255)
102 * windows specials
105 * windows specials
103
106
104 these characters will be escaped by encodefunctions
107 these characters will be escaped by encodefunctions
105 """
108 """
106 winreserved = [ord(x) for x in u'\\:*?"<>|']
109 winreserved = [ord(x) for x in u'\\:*?"<>|']
107 for x in range(32):
110 for x in range(32):
108 yield x
111 yield x
109 for x in range(126, 256):
112 for x in range(126, 256):
110 yield x
113 yield x
111 for x in winreserved:
114 for x in winreserved:
112 yield x
115 yield x
113
116
114
117
def _buildencodefun():
    """Build the (encode, decode) callable pair for filename encoding.

    Uppercase letters and `_` are escaped as `_` followed by the
    lowercase letter; reserved bytes become `~xx` hex escapes.

    >>> enc, dec = _buildencodefun()

    >>> enc(b'nothing/special.txt')
    'nothing/special.txt'
    >>> dec(b'nothing/special.txt')
    'nothing/special.txt'

    >>> enc(b'HELLO')
    '_h_e_l_l_o'
    >>> dec(b'_h_e_l_l_o')
    'HELLO'

    >>> enc(b'hello:world?')
    'hello~3aworld~3f'
    >>> dec(b'hello~3aworld~3f')
    'hello:world?'

    >>> enc(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    >>> dec(b'the~07quick~adshot')
    'the\\x07quick\\xadshot'
    """
    e = b'_'
    xchr = pycompat.bytechr
    # start from the identity mapping for plain ASCII...
    cmap = {xchr(x): xchr(x) for x in range(127)}
    # ...then escape reserved bytes as '~xx'...
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    # ...and uppercase letters plus the escape char itself as '_x'
    for x in list(range(ord(b"A"), ord(b"Z") + 1)) + [ord(e)]:
        cmap[xchr(x)] = e + xchr(x).lower()

    # reverse mapping: escape sequence -> original byte
    dmap = {v: k for k, v in cmap.items()}

    def encode(s):
        return b''.join([cmap[s[c : c + 1]] for c in range(len(s))])

    def decode(s):
        pieces = []
        i = 0
        while i < len(s):
            # escape sequences are 1 to 3 bytes long; try shortest first
            for l in range(1, 4):
                chunk = s[i : i + l]
                if chunk in dmap:
                    pieces.append(dmap[chunk])
                    i += l
                    break
            else:
                raise KeyError
        return b''.join(pieces)

    return (encode, decode)
171
174
172
175
173 _encodefname, _decodefname = _buildencodefun()
176 _encodefname, _decodefname = _buildencodefun()
174
177
175
178
def encodefilename(s):
    """Apply directory escaping, then the reversible character encoding.

    >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
    'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
    """
    dir_safe = encodedir(s)
    return _encodefname(dir_safe)
182
185
183
186
def decodefilename(s):
    """Reverse `encodefilename`: decode characters, then directory escapes.

    >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
    'foo.i/bar.d/bla.hg/hi:world?/HELLO'
    """
    char_decoded = _decodefname(s)
    return decodedir(char_decoded)
190
193
191
194
def _buildlowerencodefun():
    """Build a one-way encoder that lowercases and escapes reserved bytes.

    >>> f = _buildlowerencodefun()
    >>> f(b'nothing/special.txt')
    'nothing/special.txt'
    >>> f(b'HELLO')
    'hello'
    >>> f(b'hello:world?')
    'hello~3aworld~3f'
    >>> f(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    """
    xchr = pycompat.bytechr
    # identity for plain ASCII, '~xx' for reserved bytes, lowercase for A-Z
    cmap = {xchr(x): xchr(x) for x in range(127)}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in range(ord(b"A"), ord(b"Z") + 1):
        cmap[xchr(x)] = xchr(x).lower()

    def lowerencode(s):
        return b"".join(map(cmap.__getitem__, pycompat.iterbytestr(s)))

    return lowerencode
215
218
216
219
217 lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
220 lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
218
221
219 # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
222 # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
220 _winres3 = (b'aux', b'con', b'prn', b'nul') # length 3
223 _winres3 = (b'aux', b'con', b'prn', b'nul') # length 3
221 _winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9)
224 _winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9)
222
225
223
226
224 def _auxencode(path, dotencode):
227 def _auxencode(path, dotencode):
225 """
228 """
226 Encodes filenames containing names reserved by Windows or which end in
229 Encodes filenames containing names reserved by Windows or which end in
227 period or space. Does not touch other single reserved characters c.
230 period or space. Does not touch other single reserved characters c.
228 Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
231 Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
229 Additionally encodes space or period at the beginning, if dotencode is
232 Additionally encodes space or period at the beginning, if dotencode is
230 True. Parameter path is assumed to be all lowercase.
233 True. Parameter path is assumed to be all lowercase.
231 A segment only needs encoding if a reserved name appears as a
234 A segment only needs encoding if a reserved name appears as a
232 basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
235 basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
233 doesn't need encoding.
236 doesn't need encoding.
234
237
235 >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
238 >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
236 >>> _auxencode(s.split(b'/'), True)
239 >>> _auxencode(s.split(b'/'), True)
237 ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
240 ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
238 >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
241 >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
239 >>> _auxencode(s.split(b'/'), False)
242 >>> _auxencode(s.split(b'/'), False)
240 ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
243 ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
241 >>> _auxencode([b'foo. '], True)
244 >>> _auxencode([b'foo. '], True)
242 ['foo.~20']
245 ['foo.~20']
243 >>> _auxencode([b' .foo'], True)
246 >>> _auxencode([b' .foo'], True)
244 ['~20.foo']
247 ['~20.foo']
245 """
248 """
246 for i, n in enumerate(path):
249 for i, n in enumerate(path):
247 if not n:
250 if not n:
248 continue
251 continue
249 if dotencode and n[0] in b'. ':
252 if dotencode and n[0] in b'. ':
250 n = b"~%02x" % ord(n[0:1]) + n[1:]
253 n = b"~%02x" % ord(n[0:1]) + n[1:]
251 path[i] = n
254 path[i] = n
252 else:
255 else:
253 l = n.find(b'.')
256 l = n.find(b'.')
254 if l == -1:
257 if l == -1:
255 l = len(n)
258 l = len(n)
256 if (l == 3 and n[:3] in _winres3) or (
259 if (l == 3 and n[:3] in _winres3) or (
257 l == 4
260 l == 4
258 and n[3:4] <= b'9'
261 and n[3:4] <= b'9'
259 and n[3:4] >= b'1'
262 and n[3:4] >= b'1'
260 and n[:3] in _winres4
263 and n[:3] in _winres4
261 ):
264 ):
262 # encode third letter ('aux' -> 'au~78')
265 # encode third letter ('aux' -> 'au~78')
263 ec = b"~%02x" % ord(n[2:3])
266 ec = b"~%02x" % ord(n[2:3])
264 n = n[0:2] + ec + n[3:]
267 n = n[0:2] + ec + n[3:]
265 path[i] = n
268 path[i] = n
266 if n[-1] in b'. ':
269 if n[-1] in b'. ':
267 # encode last period or space ('foo...' -> 'foo..~2e')
270 # encode last period or space ('foo...' -> 'foo..~2e')
268 path[i] = n[:-1] + b"~%02x" % ord(n[-1:])
271 path[i] = n[:-1] + b"~%02x" % ord(n[-1:])
269 return path
272 return path
270
273
271
274
_maxstorepathlen = 120
_dirprefixlen = 8
_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4


def _hashencode(path, dotencode):
    """Hash-based, non-reversible encoding for over-long store paths.

    The result is 'dh/' + shortened directory prefixes (at most
    `_dirprefixlen` chars each, `_maxshortdirslen` in total) + as much
    of the basename as fits + the sha1 digest of the full path + the
    original extension, keeping the total under `_maxstorepathlen`.
    """
    digest = hex(hashutil.sha1(path).digest())
    # skip prefix 'data/' or 'meta/' before lower-encoding
    segments = lowerencode(path[5:]).split(b'/')
    parts = _auxencode(segments, dotencode)
    basename = parts[-1]
    _root, ext = os.path.splitext(basename)
    sdirs = []
    sdirslen = 0
    for p in parts[:-1]:
        d = p[:_dirprefixlen]
        if d[-1] in b'. ':
            # Windows can't access dirs ending in period or space
            d = d[:-1] + b'_'
        # account for the '/' separator except before the first dir
        total = len(d) if sdirslen == 0 else sdirslen + 1 + len(d)
        if total > _maxshortdirslen:
            break
        sdirs.append(d)
        sdirslen = total
    dirs = b'/'.join(sdirs)
    if dirs:
        dirs += b'/'
    res = b'dh/' + dirs + digest + ext
    spaceleft = _maxstorepathlen - len(res)
    if spaceleft > 0:
        # pad with as much of the basename as still fits
        res = b'dh/' + dirs + basename[:spaceleft] + digest + ext
    return res
307
310
308
311
def _hybridencode(path, dotencode):
    """encodes path with a length limit

    Encodes all paths that begin with 'data/', according to the following.

    Default encoding (reversible):

    Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
    characters are encoded as '~xx', where xx is the two digit hex code
    of the character (see encodefilename).
    Relevant path components consisting of Windows reserved filenames are
    masked by encoding the third character ('aux' -> 'au~78', see _auxencode).

    Hashed encoding (not reversible):

    If the default-encoded path is longer than _maxstorepathlen, a
    non-reversible hybrid hashing of the path is done instead: up to
    _dirprefixlen characters of every directory level (no more levels
    than fit into _maxshortdirslen), then a filler taken from the start
    of the basename, then the sha digest of the full path. The filler
    is as long as possible while keeping the result within
    _maxstorepathlen characters. The extension (e.g. '.i' or '.d') is
    preserved, and the leading 'data/' is replaced with 'dh/'.
    """
    # note: encodedir is not idempotent, so it is applied exactly once
    # and the escaped path is what _hashencode receives as well
    path = encodedir(path)
    segments = _encodefname(path).split(b'/')
    res = b'/'.join(_auxencode(segments, dotencode))
    if len(res) > _maxstorepathlen:
        return _hashencode(path, dotencode)
    return res
346
349
347
350
def _pathencode(path):
    """Python fallback for the C `pathencode` (dotencode variant).

    Falls back to the hashed encoding whenever either the raw path or
    its default encoding exceeds `_maxstorepathlen`.
    """
    de = encodedir(path)
    if len(path) > _maxstorepathlen:
        return _hashencode(de, True)
    segments = _encodefname(de).split(b'/')
    res = b'/'.join(_auxencode(segments, True))
    if len(res) > _maxstorepathlen:
        return _hashencode(de, True)
    return res
357
360
358
361
359 _pathencode = getattr(parsers, 'pathencode', _pathencode)
362 _pathencode = getattr(parsers, 'pathencode', _pathencode)
360
363
361
364
def _plainhybridencode(f):
    """Hybrid-encode `f` with dotencode disabled."""
    return _hybridencode(f, False)
364
367
365
368
def _calcmode(vfs):
    """Return the permission mode for files created in .hg/, or None.

    None means the umask-derived default already matches the store
    directory's mode, so chmod calls can be skipped.
    """
    try:
        # files in .hg/ will be created using this mode
        mode = vfs.stat().st_mode
    except OSError:
        return None
    # avoid some useless chmods
    if (0o777 & ~util.umask) == (0o777 & mode):
        return None
    return mode
376
379
377
380
378 _data = [
381 _data = [
379 b'bookmarks',
382 b'bookmarks',
380 b'narrowspec',
383 b'narrowspec',
381 b'data',
384 b'data',
382 b'meta',
385 b'meta',
383 b'00manifest.d',
386 b'00manifest.d',
384 b'00manifest.i',
387 b'00manifest.i',
385 b'00changelog.d',
388 b'00changelog.d',
386 b'00changelog.i',
389 b'00changelog.i',
387 b'phaseroots',
390 b'phaseroots',
388 b'obsstore',
391 b'obsstore',
389 b'requires',
392 b'requires',
390 ]
393 ]
391
394
392 REVLOG_FILES_EXT = (
395 REVLOG_FILES_EXT = (
393 b'.i',
396 b'.i',
394 b'.idx',
397 b'.idx',
395 b'.d',
398 b'.d',
396 b'.dat',
399 b'.dat',
397 b'.n',
400 b'.n',
398 b'.nd',
401 b'.nd',
399 b'.sda',
402 b'.sda',
400 )
403 )
401 # file extension that also use a `-SOMELONGIDHASH.ext` form
404 # file extension that also use a `-SOMELONGIDHASH.ext` form
402 REVLOG_FILES_LONG_EXT = (
405 REVLOG_FILES_LONG_EXT = (
403 b'.nd',
406 b'.nd',
404 b'.idx',
407 b'.idx',
405 b'.dat',
408 b'.dat',
406 b'.sda',
409 b'.sda',
407 )
410 )
408 # files that are "volatile" and might change between listing and streaming
411 # files that are "volatile" and might change between listing and streaming
409 #
412 #
410 # note: the ".nd" file are nodemap data and won't "change" but they might be
413 # note: the ".nd" file are nodemap data and won't "change" but they might be
411 # deleted.
414 # deleted.
412 REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')
415 REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')
413
416
414 # some exception to the above matching
417 # some exception to the above matching
415 #
418 #
416 # XXX This is currently not in use because of issue6542
419 # XXX This is currently not in use because of issue6542
417 EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')
420 EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')
418
421
419
422
def is_revlog(f, kind, st):
    """Return whether directory entry `f` of stat-kind `kind` is a revlog file.

    `st` is accepted for interface compatibility but unused here.
    """
    return kind == stat.S_IFREG and f.endswith(REVLOG_FILES_EXT)
426
429
427
430
def is_revlog_file(f):
    """Return whether path `f` carries one of the revlog file extensions."""
    return bool(f.endswith(REVLOG_FILES_EXT))
432
435
433
436
434 # the file is part of changelog data
435 FILEFLAGS_CHANGELOG = 1 << 13
436 # the file is part of manifest data
437 FILEFLAGS_MANIFESTLOG = 1 << 12
438 # the file is part of filelog data
439 FILEFLAGS_FILELOG = 1 << 11
440 # file that are not directly part of a revlog
441 FILEFLAGS_OTHER = 1 << 10
442
443 # the main entry point for a revlog
444 FILEFLAGS_REVLOG_MAIN = 1 << 1
445 # a secondary file for a revlog
446 FILEFLAGS_REVLOG_OTHER = 1 << 0
447
448 # files that are "volatile" and might change between listing and streaming
449 FILEFLAGS_VOLATILE = 1 << 20
450
451 FILETYPE_CHANGELOG_MAIN = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_MAIN
452 FILETYPE_CHANGELOG_OTHER = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_OTHER
453 FILETYPE_MANIFESTLOG_MAIN = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_MAIN
454 FILETYPE_MANIFESTLOG_OTHER = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_OTHER
455 FILETYPE_FILELOG_MAIN = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_MAIN
456 FILETYPE_FILELOG_OTHER = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_OTHER
457 FILETYPE_OTHER = FILEFLAGS_OTHER
458
459
@attr.s(slots=True)
class StoreFile:
    """a file matching a store entry"""

    unencoded_path = attr.ib()
    _file_size = attr.ib(default=None)
    is_volatile = attr.ib(default=False)

    def file_size(self, vfs):
        """Return this file's size, computing and caching it via `vfs`.

        Once the size has been computed, `vfs` may be None; calling with
        None before the first computation is a programming error.
        A missing file counts as size 0.
        """
        if self._file_size is not None:
            return self._file_size
        if vfs is None:
            msg = b"calling vfs-less file_size without prior call: %s"
            msg %= self.unencoded_path
            raise error.ProgrammingError(msg)
        try:
            self._file_size = vfs.stat(self.unencoded_path).st_size
        except FileNotFoundError:
            self._file_size = 0
        return self._file_size

    def get_stream(self, vfs, copies):
        """return data "stream" information for this file

        (unencoded_file_path, content_iterator, content_size)
        """
        size = self.file_size(None)

        def _content():
            actual_path = copies[vfs.join(self.unencoded_path)]
            with open(actual_path, 'rb') as fp:
                yield None  # ready to stream
                if size <= 65536:
                    # small enough to be read in one go
                    yield fp.read(size)
                else:
                    yield from util.filechunkiter(fp, limit=size)

        stream = _content()
        # advance to the first yield so the file is opened eagerly
        next(stream)
        return (self.unencoded_path, stream, size)
499
476
500
477
@attr.s(slots=True, init=False)
class BaseStoreEntry:
    """An entry in the store

    This is returned by `store.walk` and represent some data in the store."""

    def files(self) -> List[StoreFile]:
        """Return the StoreFile objects backing this entry (abstract)."""
        raise NotImplementedError

    def get_streams(
        self,
        repo=None,
        vfs=None,
        copies=None,
        max_changeset=None,
    ):
        """return a list of data stream associated to files for this entry

        return [(unencoded_file_path, content_iterator, content_size), …]
        """
        assert vfs is not None
        return [entry_file.get_stream(vfs, copies) for entry_file in self.files()]
523
500
524
501
@attr.s(slots=True, init=False)
class SimpleStoreEntry(BaseStoreEntry):
    """A generic entry in the store"""

    is_revlog = False

    _entry_path = attr.ib()
    _is_volatile = attr.ib(default=False)
    _file_size = attr.ib(default=None)
    _files = attr.ib(default=None)

    def __init__(
        self,
        entry_path,
        is_volatile=False,
        file_size=None,
    ):
        super().__init__()
        self._entry_path = entry_path
        self._is_volatile = is_volatile
        self._file_size = file_size
        # the StoreFile list is built lazily by files()
        self._files = None

    def files(self) -> List[StoreFile]:
        """Return (and cache) the single StoreFile backing this entry."""
        if self._files is None:
            single = StoreFile(
                unencoded_path=self._entry_path,
                file_size=self._file_size,
                is_volatile=self._is_volatile,
            )
            self._files = [single]
        return self._files
558
535
559
536
560 @attr.s(slots=True, init=False)
537 @attr.s(slots=True, init=False)
561 class RevlogStoreEntry(BaseStoreEntry):
538 class RevlogStoreEntry(BaseStoreEntry):
562 """A revlog entry in the store"""
539 """A revlog entry in the store"""
563
540
564 is_revlog = True
541 is_revlog = True
565
542
566 revlog_type = attr.ib(default=None)
543 revlog_type = attr.ib(default=None)
567 target_id = attr.ib(default=None)
544 target_id = attr.ib(default=None)
568 _path_prefix = attr.ib(default=None)
545 _path_prefix = attr.ib(default=None)
569 _details = attr.ib(default=None)
546 _details = attr.ib(default=None)
570 _files = attr.ib(default=None)
547 _files = attr.ib(default=None)
571
548
572 def __init__(
549 def __init__(
573 self,
550 self,
574 revlog_type,
551 revlog_type,
575 path_prefix,
552 path_prefix,
576 target_id,
553 target_id,
577 details,
554 details,
578 ):
555 ):
579 super().__init__()
556 super().__init__()
580 self.revlog_type = revlog_type
557 self.revlog_type = revlog_type
581 self.target_id = target_id
558 self.target_id = target_id
582 self._path_prefix = path_prefix
559 self._path_prefix = path_prefix
583 assert b'.i' in details, (path_prefix, details)
560 assert b'.i' in details, (path_prefix, details)
584 self._details = details
561 self._details = details
585 self._files = None
562 self._files = None
586
563
587 @property
564 @property
588 def is_changelog(self):
565 def is_changelog(self):
589 return self.revlog_type & FILEFLAGS_CHANGELOG
566 return self.revlog_type == KIND_CHANGELOG
590
567
591 @property
568 @property
592 def is_manifestlog(self):
569 def is_manifestlog(self):
593 return self.revlog_type & FILEFLAGS_MANIFESTLOG
570 return self.revlog_type == KIND_MANIFESTLOG
594
571
595 @property
572 @property
596 def is_filelog(self):
573 def is_filelog(self):
597 return self.revlog_type & FILEFLAGS_FILELOG
574 return self.revlog_type == KIND_FILELOG
598
575
599 def main_file_path(self):
576 def main_file_path(self):
600 """unencoded path of the main revlog file"""
577 """unencoded path of the main revlog file"""
601 return self._path_prefix + b'.i'
578 return self._path_prefix + b'.i'
602
579
603 def files(self) -> List[StoreFile]:
580 def files(self) -> List[StoreFile]:
604 if self._files is None:
581 if self._files is None:
605 self._files = []
582 self._files = []
606 for ext in sorted(self._details, key=_ext_key):
583 for ext in sorted(self._details, key=_ext_key):
607 path = self._path_prefix + ext
584 path = self._path_prefix + ext
608 file_size = self._details[ext]
585 file_size = self._details[ext]
609 # files that are "volatile" and might change between
586 # files that are "volatile" and might change between
610 # listing and streaming
587 # listing and streaming
611 #
588 #
612 # note: the ".nd" file are nodemap data and won't "change"
589 # note: the ".nd" file are nodemap data and won't "change"
613 # but they might be deleted.
590 # but they might be deleted.
614 volatile = ext.endswith(REVLOG_FILES_VOLATILE_EXT)
591 volatile = ext.endswith(REVLOG_FILES_VOLATILE_EXT)
615 f = StoreFile(path, file_size, volatile)
592 f = StoreFile(path, file_size, volatile)
616 self._files.append(f)
593 self._files.append(f)
617 return self._files
594 return self._files
618
595
619 def get_streams(
596 def get_streams(
620 self,
597 self,
621 repo=None,
598 repo=None,
622 vfs=None,
599 vfs=None,
623 copies=None,
600 copies=None,
624 max_changeset=None,
601 max_changeset=None,
625 ):
602 ):
626 if (
603 if (
627 repo is None
604 repo is None
628 or max_changeset is None
605 or max_changeset is None
629 # This use revlog-v2, ignore for now
606 # This use revlog-v2, ignore for now
630 or any(k.endswith(b'.idx') for k in self._details.keys())
607 or any(k.endswith(b'.idx') for k in self._details.keys())
631 # This is not inline, no race expected
608 # This is not inline, no race expected
632 or b'.d' in self._details
609 or b'.d' in self._details
633 ):
610 ):
634 return super().get_streams(
611 return super().get_streams(
635 repo=repo,
612 repo=repo,
636 vfs=vfs,
613 vfs=vfs,
637 copies=copies,
614 copies=copies,
638 max_changeset=max_changeset,
615 max_changeset=max_changeset,
639 )
616 )
640
617
641 name_to_size = {}
618 name_to_size = {}
642 for f in self.files():
619 for f in self.files():
643 name_to_size[f.unencoded_path] = f.file_size(None)
620 name_to_size[f.unencoded_path] = f.file_size(None)
644
621
645 stream = [
622 stream = [
646 f.get_stream(vfs, copies)
623 f.get_stream(vfs, copies)
647 for f in self.files()
624 for f in self.files()
648 if not f.unencoded_path.endswith(b'.i')
625 if not f.unencoded_path.endswith(b'.i')
649 ]
626 ]
650
627
651 index_path = self._path_prefix + b'.i'
628 index_path = self._path_prefix + b'.i'
652
629
653 index_file = None
630 index_file = None
654 try:
631 try:
655 index_file = vfs(index_path)
632 index_file = vfs(index_path)
656 header = index_file.read(INDEX_HEADER.size)
633 header = index_file.read(INDEX_HEADER.size)
657 if revlogmod.revlog.is_inline_index(header):
634 if revlogmod.revlog.is_inline_index(header):
658 size = name_to_size[index_path]
635 size = name_to_size[index_path]
659
636
660 # no split underneath, just return the stream
637 # no split underneath, just return the stream
661 def get_stream():
638 def get_stream():
662 fp = index_file
639 fp = index_file
663 try:
640 try:
664 fp.seek(0)
641 fp.seek(0)
665 yield None
642 yield None
666 if size <= 65536:
643 if size <= 65536:
667 yield fp.read(size)
644 yield fp.read(size)
668 else:
645 else:
669 yield from util.filechunkiter(fp, limit=size)
646 yield from util.filechunkiter(fp, limit=size)
670 finally:
647 finally:
671 fp.close()
648 fp.close()
672
649
673 s = get_stream()
650 s = get_stream()
674 next(s)
651 next(s)
675 index_file = None
652 index_file = None
676 stream.append((index_path, s, size))
653 stream.append((index_path, s, size))
677 else:
654 else:
678 rl = self.get_revlog_instance(repo).get_revlog()
655 rl = self.get_revlog_instance(repo).get_revlog()
679 rl_stream = rl.get_streams(max_changeset, force_inline=True)
656 rl_stream = rl.get_streams(max_changeset, force_inline=True)
680 for name, s, size in rl_stream:
657 for name, s, size in rl_stream:
681 if name_to_size.get(name, 0) != size:
658 if name_to_size.get(name, 0) != size:
682 msg = _(b"expected %d bytes but %d provided for %s")
659 msg = _(b"expected %d bytes but %d provided for %s")
683 msg %= name_to_size.get(name, 0), size, name
660 msg %= name_to_size.get(name, 0), size, name
684 raise error.Abort(msg)
661 raise error.Abort(msg)
685 stream.extend(rl_stream)
662 stream.extend(rl_stream)
686 finally:
663 finally:
687 if index_file is not None:
664 if index_file is not None:
688 index_file.close()
665 index_file.close()
689
666
690 files = self.files()
667 files = self.files()
691 assert len(stream) == len(files), (
668 assert len(stream) == len(files), (
692 stream,
669 stream,
693 files,
670 files,
694 self._path_prefix,
671 self._path_prefix,
695 self.target_id,
672 self.target_id,
696 )
673 )
697 return stream
674 return stream
698
675
699 def get_revlog_instance(self, repo):
676 def get_revlog_instance(self, repo):
700 """Obtain a revlog instance from this store entry
677 """Obtain a revlog instance from this store entry
701
678
702 An instance of the appropriate class is returned.
679 An instance of the appropriate class is returned.
703 """
680 """
704 if self.is_changelog:
681 if self.is_changelog:
705 return changelog.changelog(repo.svfs)
682 return changelog.changelog(repo.svfs)
706 elif self.is_manifestlog:
683 elif self.is_manifestlog:
707 mandir = self.target_id
684 mandir = self.target_id
708 return manifest.manifestrevlog(
685 return manifest.manifestrevlog(
709 repo.nodeconstants, repo.svfs, tree=mandir
686 repo.nodeconstants, repo.svfs, tree=mandir
710 )
687 )
711 else:
688 else:
712 return filelog.filelog(repo.svfs, self.target_id)
689 return filelog.filelog(repo.svfs, self.target_id)
713
690
714
691
715 def _gather_revlog(files_data):
692 def _gather_revlog(files_data):
716 """group files per revlog prefix
693 """group files per revlog prefix
717
694
718 The returns a two level nested dict. The top level key is the revlog prefix
695 The returns a two level nested dict. The top level key is the revlog prefix
719 without extension, the second level is all the file "suffix" that were
696 without extension, the second level is all the file "suffix" that were
720 seen for this revlog and arbitrary file data as value.
697 seen for this revlog and arbitrary file data as value.
721 """
698 """
722 revlogs = collections.defaultdict(dict)
699 revlogs = collections.defaultdict(dict)
723 for u, value in files_data:
700 for u, value in files_data:
724 name, ext = _split_revlog_ext(u)
701 name, ext = _split_revlog_ext(u)
725 revlogs[name][ext] = value
702 revlogs[name][ext] = value
726 return sorted(revlogs.items())
703 return sorted(revlogs.items())
727
704
728
705
729 def _split_revlog_ext(filename):
706 def _split_revlog_ext(filename):
730 """split the revlog file prefix from the variable extension"""
707 """split the revlog file prefix from the variable extension"""
731 if filename.endswith(REVLOG_FILES_LONG_EXT):
708 if filename.endswith(REVLOG_FILES_LONG_EXT):
732 char = b'-'
709 char = b'-'
733 else:
710 else:
734 char = b'.'
711 char = b'.'
735 idx = filename.rfind(char)
712 idx = filename.rfind(char)
736 return filename[:idx], filename[idx:]
713 return filename[:idx], filename[idx:]
737
714
738
715
739 def _ext_key(ext):
716 def _ext_key(ext):
740 """a key to order revlog suffix
717 """a key to order revlog suffix
741
718
742 important to issue .i after other entry."""
719 important to issue .i after other entry."""
743 # the only important part of this order is to keep the `.i` last.
720 # the only important part of this order is to keep the `.i` last.
744 if ext.endswith(b'.n'):
721 if ext.endswith(b'.n'):
745 return (0, ext)
722 return (0, ext)
746 elif ext.endswith(b'.nd'):
723 elif ext.endswith(b'.nd'):
747 return (10, ext)
724 return (10, ext)
748 elif ext.endswith(b'.d'):
725 elif ext.endswith(b'.d'):
749 return (20, ext)
726 return (20, ext)
750 elif ext.endswith(b'.i'):
727 elif ext.endswith(b'.i'):
751 return (50, ext)
728 return (50, ext)
752 else:
729 else:
753 return (40, ext)
730 return (40, ext)
754
731
755
732
756 class basicstore:
733 class basicstore:
757 '''base class for local repository stores'''
734 '''base class for local repository stores'''
758
735
759 def __init__(self, path, vfstype):
736 def __init__(self, path, vfstype):
760 vfs = vfstype(path)
737 vfs = vfstype(path)
761 self.path = vfs.base
738 self.path = vfs.base
762 self.createmode = _calcmode(vfs)
739 self.createmode = _calcmode(vfs)
763 vfs.createmode = self.createmode
740 vfs.createmode = self.createmode
764 self.rawvfs = vfs
741 self.rawvfs = vfs
765 self.vfs = vfsmod.filtervfs(vfs, encodedir)
742 self.vfs = vfsmod.filtervfs(vfs, encodedir)
766 self.opener = self.vfs
743 self.opener = self.vfs
767
744
768 def join(self, f):
745 def join(self, f):
769 return self.path + b'/' + encodedir(f)
746 return self.path + b'/' + encodedir(f)
770
747
771 def _walk(self, relpath, recurse, undecodable=None):
748 def _walk(self, relpath, recurse, undecodable=None):
772 '''yields (revlog_type, unencoded, size)'''
749 '''yields (revlog_type, unencoded, size)'''
773 path = self.path
750 path = self.path
774 if relpath:
751 if relpath:
775 path += b'/' + relpath
752 path += b'/' + relpath
776 striplen = len(self.path) + 1
753 striplen = len(self.path) + 1
777 l = []
754 l = []
778 if self.rawvfs.isdir(path):
755 if self.rawvfs.isdir(path):
779 visit = [path]
756 visit = [path]
780 readdir = self.rawvfs.readdir
757 readdir = self.rawvfs.readdir
781 while visit:
758 while visit:
782 p = visit.pop()
759 p = visit.pop()
783 for f, kind, st in readdir(p, stat=True):
760 for f, kind, st in readdir(p, stat=True):
784 fp = p + b'/' + f
761 fp = p + b'/' + f
785 if is_revlog(f, kind, st):
762 if is_revlog(f, kind, st):
786 n = util.pconvert(fp[striplen:])
763 n = util.pconvert(fp[striplen:])
787 l.append((decodedir(n), st.st_size))
764 l.append((decodedir(n), st.st_size))
788 elif kind == stat.S_IFDIR and recurse:
765 elif kind == stat.S_IFDIR and recurse:
789 visit.append(fp)
766 visit.append(fp)
790
767
791 l.sort()
768 l.sort()
792 return l
769 return l
793
770
794 def changelog(self, trypending, concurrencychecker=None):
771 def changelog(self, trypending, concurrencychecker=None):
795 return changelog.changelog(
772 return changelog.changelog(
796 self.vfs,
773 self.vfs,
797 trypending=trypending,
774 trypending=trypending,
798 concurrencychecker=concurrencychecker,
775 concurrencychecker=concurrencychecker,
799 )
776 )
800
777
801 def manifestlog(self, repo, storenarrowmatch):
778 def manifestlog(self, repo, storenarrowmatch):
802 rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
779 rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
803 return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)
780 return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)
804
781
805 def data_entries(
782 def data_entries(
806 self, matcher=None, undecodable=None
783 self, matcher=None, undecodable=None
807 ) -> Generator[BaseStoreEntry, None, None]:
784 ) -> Generator[BaseStoreEntry, None, None]:
808 """Like walk, but excluding the changelog and root manifest.
785 """Like walk, but excluding the changelog and root manifest.
809
786
810 When [undecodable] is None, revlogs names that can't be
787 When [undecodable] is None, revlogs names that can't be
811 decoded cause an exception. When it is provided, it should
788 decoded cause an exception. When it is provided, it should
812 be a list and the filenames that can't be decoded are added
789 be a list and the filenames that can't be decoded are added
813 to it instead. This is very rarely needed."""
790 to it instead. This is very rarely needed."""
814 dirs = [
791 dirs = [
815 (b'data', FILEFLAGS_FILELOG, False),
792 (b'data', KIND_FILELOG, False),
816 (b'meta', FILEFLAGS_MANIFESTLOG, True),
793 (b'meta', KIND_MANIFESTLOG, True),
817 ]
794 ]
818 for base_dir, rl_type, strip_filename in dirs:
795 for base_dir, rl_type, strip_filename in dirs:
819 files = self._walk(base_dir, True, undecodable=undecodable)
796 files = self._walk(base_dir, True, undecodable=undecodable)
820 for revlog, details in _gather_revlog(files):
797 for revlog, details in _gather_revlog(files):
821 revlog_target_id = revlog.split(b'/', 1)[1]
798 revlog_target_id = revlog.split(b'/', 1)[1]
822 if strip_filename and b'/' in revlog:
799 if strip_filename and b'/' in revlog:
823 revlog_target_id = revlog_target_id.rsplit(b'/', 1)[0]
800 revlog_target_id = revlog_target_id.rsplit(b'/', 1)[0]
824 revlog_target_id += b'/'
801 revlog_target_id += b'/'
825 yield RevlogStoreEntry(
802 yield RevlogStoreEntry(
826 path_prefix=revlog,
803 path_prefix=revlog,
827 revlog_type=rl_type,
804 revlog_type=rl_type,
828 target_id=revlog_target_id,
805 target_id=revlog_target_id,
829 details=details,
806 details=details,
830 )
807 )
831
808
832 def top_entries(
809 def top_entries(
833 self, phase=False, obsolescence=False
810 self, phase=False, obsolescence=False
834 ) -> Generator[BaseStoreEntry, None, None]:
811 ) -> Generator[BaseStoreEntry, None, None]:
835 if phase and self.vfs.exists(b'phaseroots'):
812 if phase and self.vfs.exists(b'phaseroots'):
836 yield SimpleStoreEntry(
813 yield SimpleStoreEntry(
837 entry_path=b'phaseroots',
814 entry_path=b'phaseroots',
838 is_volatile=True,
815 is_volatile=True,
839 )
816 )
840
817
841 if obsolescence and self.vfs.exists(b'obsstore'):
818 if obsolescence and self.vfs.exists(b'obsstore'):
842 # XXX if we had the file size it could be non-volatile
819 # XXX if we had the file size it could be non-volatile
843 yield SimpleStoreEntry(
820 yield SimpleStoreEntry(
844 entry_path=b'obsstore',
821 entry_path=b'obsstore',
845 is_volatile=True,
822 is_volatile=True,
846 )
823 )
847
824
848 files = reversed(self._walk(b'', False))
825 files = reversed(self._walk(b'', False))
849
826
850 changelogs = collections.defaultdict(dict)
827 changelogs = collections.defaultdict(dict)
851 manifestlogs = collections.defaultdict(dict)
828 manifestlogs = collections.defaultdict(dict)
852
829
853 for u, s in files:
830 for u, s in files:
854 if u.startswith(b'00changelog'):
831 if u.startswith(b'00changelog'):
855 name, ext = _split_revlog_ext(u)
832 name, ext = _split_revlog_ext(u)
856 changelogs[name][ext] = s
833 changelogs[name][ext] = s
857 elif u.startswith(b'00manifest'):
834 elif u.startswith(b'00manifest'):
858 name, ext = _split_revlog_ext(u)
835 name, ext = _split_revlog_ext(u)
859 manifestlogs[name][ext] = s
836 manifestlogs[name][ext] = s
860 else:
837 else:
861 yield SimpleStoreEntry(
838 yield SimpleStoreEntry(
862 entry_path=u,
839 entry_path=u,
863 is_volatile=False,
840 is_volatile=False,
864 file_size=s,
841 file_size=s,
865 )
842 )
866 # yield manifest before changelog
843 # yield manifest before changelog
867 top_rl = [
844 top_rl = [
868 (manifestlogs, FILEFLAGS_MANIFESTLOG),
845 (manifestlogs, KIND_MANIFESTLOG),
869 (changelogs, FILEFLAGS_CHANGELOG),
846 (changelogs, KIND_CHANGELOG),
870 ]
847 ]
871 assert len(manifestlogs) <= 1
848 assert len(manifestlogs) <= 1
872 assert len(changelogs) <= 1
849 assert len(changelogs) <= 1
873 for data, revlog_type in top_rl:
850 for data, revlog_type in top_rl:
874 for revlog, details in sorted(data.items()):
851 for revlog, details in sorted(data.items()):
875 yield RevlogStoreEntry(
852 yield RevlogStoreEntry(
876 path_prefix=revlog,
853 path_prefix=revlog,
877 revlog_type=revlog_type,
854 revlog_type=revlog_type,
878 target_id=b'',
855 target_id=b'',
879 details=details,
856 details=details,
880 )
857 )
881
858
882 def walk(
859 def walk(
883 self, matcher=None, phase=False, obsolescence=False
860 self, matcher=None, phase=False, obsolescence=False
884 ) -> Generator[BaseStoreEntry, None, None]:
861 ) -> Generator[BaseStoreEntry, None, None]:
885 """return files related to data storage (ie: revlogs)
862 """return files related to data storage (ie: revlogs)
886
863
887 yields instance from BaseStoreEntry subclasses
864 yields instance from BaseStoreEntry subclasses
888
865
889 if a matcher is passed, storage files of only those tracked paths
866 if a matcher is passed, storage files of only those tracked paths
890 are passed with matches the matcher
867 are passed with matches the matcher
891 """
868 """
892 # yield data files first
869 # yield data files first
893 for x in self.data_entries(matcher):
870 for x in self.data_entries(matcher):
894 yield x
871 yield x
895 for x in self.top_entries(phase=phase, obsolescence=obsolescence):
872 for x in self.top_entries(phase=phase, obsolescence=obsolescence):
896 yield x
873 yield x
897
874
898 def copylist(self):
875 def copylist(self):
899 return _data
876 return _data
900
877
901 def write(self, tr):
878 def write(self, tr):
902 pass
879 pass
903
880
904 def invalidatecaches(self):
881 def invalidatecaches(self):
905 pass
882 pass
906
883
907 def markremoved(self, fn):
884 def markremoved(self, fn):
908 pass
885 pass
909
886
910 def __contains__(self, path):
887 def __contains__(self, path):
911 '''Checks if the store contains path'''
888 '''Checks if the store contains path'''
912 path = b"/".join((b"data", path))
889 path = b"/".join((b"data", path))
913 # file?
890 # file?
914 if self.vfs.exists(path + b".i"):
891 if self.vfs.exists(path + b".i"):
915 return True
892 return True
916 # dir?
893 # dir?
917 if not path.endswith(b"/"):
894 if not path.endswith(b"/"):
918 path = path + b"/"
895 path = path + b"/"
919 return self.vfs.exists(path)
896 return self.vfs.exists(path)
920
897
921
898
922 class encodedstore(basicstore):
899 class encodedstore(basicstore):
923 def __init__(self, path, vfstype):
900 def __init__(self, path, vfstype):
924 vfs = vfstype(path + b'/store')
901 vfs = vfstype(path + b'/store')
925 self.path = vfs.base
902 self.path = vfs.base
926 self.createmode = _calcmode(vfs)
903 self.createmode = _calcmode(vfs)
927 vfs.createmode = self.createmode
904 vfs.createmode = self.createmode
928 self.rawvfs = vfs
905 self.rawvfs = vfs
929 self.vfs = vfsmod.filtervfs(vfs, encodefilename)
906 self.vfs = vfsmod.filtervfs(vfs, encodefilename)
930 self.opener = self.vfs
907 self.opener = self.vfs
931
908
932 def _walk(self, relpath, recurse, undecodable=None):
909 def _walk(self, relpath, recurse, undecodable=None):
933 old = super()._walk(relpath, recurse)
910 old = super()._walk(relpath, recurse)
934 new = []
911 new = []
935 for f1, value in old:
912 for f1, value in old:
936 try:
913 try:
937 f2 = decodefilename(f1)
914 f2 = decodefilename(f1)
938 except KeyError:
915 except KeyError:
939 if undecodable is None:
916 if undecodable is None:
940 msg = _(b'undecodable revlog name %s') % f1
917 msg = _(b'undecodable revlog name %s') % f1
941 raise error.StorageError(msg)
918 raise error.StorageError(msg)
942 else:
919 else:
943 undecodable.append(f1)
920 undecodable.append(f1)
944 continue
921 continue
945 new.append((f2, value))
922 new.append((f2, value))
946 return new
923 return new
947
924
948 def data_entries(
925 def data_entries(
949 self, matcher=None, undecodable=None
926 self, matcher=None, undecodable=None
950 ) -> Generator[BaseStoreEntry, None, None]:
927 ) -> Generator[BaseStoreEntry, None, None]:
951 entries = super(encodedstore, self).data_entries(
928 entries = super(encodedstore, self).data_entries(
952 undecodable=undecodable
929 undecodable=undecodable
953 )
930 )
954 for entry in entries:
931 for entry in entries:
955 if _match_tracked_entry(entry, matcher):
932 if _match_tracked_entry(entry, matcher):
956 yield entry
933 yield entry
957
934
958 def join(self, f):
935 def join(self, f):
959 return self.path + b'/' + encodefilename(f)
936 return self.path + b'/' + encodefilename(f)
960
937
961 def copylist(self):
938 def copylist(self):
962 return [b'requires', b'00changelog.i'] + [b'store/' + f for f in _data]
939 return [b'requires', b'00changelog.i'] + [b'store/' + f for f in _data]
963
940
964
941
965 class fncache:
942 class fncache:
966 # the filename used to be partially encoded
943 # the filename used to be partially encoded
967 # hence the encodedir/decodedir dance
944 # hence the encodedir/decodedir dance
968 def __init__(self, vfs):
945 def __init__(self, vfs):
969 self.vfs = vfs
946 self.vfs = vfs
970 self._ignores = set()
947 self._ignores = set()
971 self.entries = None
948 self.entries = None
972 self._dirty = False
949 self._dirty = False
973 # set of new additions to fncache
950 # set of new additions to fncache
974 self.addls = set()
951 self.addls = set()
975
952
976 def ensureloaded(self, warn=None):
953 def ensureloaded(self, warn=None):
977 """read the fncache file if not already read.
954 """read the fncache file if not already read.
978
955
979 If the file on disk is corrupted, raise. If warn is provided,
956 If the file on disk is corrupted, raise. If warn is provided,
980 warn and keep going instead."""
957 warn and keep going instead."""
981 if self.entries is None:
958 if self.entries is None:
982 self._load(warn)
959 self._load(warn)
983
960
984 def _load(self, warn=None):
961 def _load(self, warn=None):
985 '''fill the entries from the fncache file'''
962 '''fill the entries from the fncache file'''
986 self._dirty = False
963 self._dirty = False
987 try:
964 try:
988 fp = self.vfs(b'fncache', mode=b'rb')
965 fp = self.vfs(b'fncache', mode=b'rb')
989 except IOError:
966 except IOError:
990 # skip nonexistent file
967 # skip nonexistent file
991 self.entries = set()
968 self.entries = set()
992 return
969 return
993
970
994 self.entries = set()
971 self.entries = set()
995 chunk = b''
972 chunk = b''
996 for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
973 for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
997 chunk += c
974 chunk += c
998 try:
975 try:
999 p = chunk.rindex(b'\n')
976 p = chunk.rindex(b'\n')
1000 self.entries.update(decodedir(chunk[: p + 1]).splitlines())
977 self.entries.update(decodedir(chunk[: p + 1]).splitlines())
1001 chunk = chunk[p + 1 :]
978 chunk = chunk[p + 1 :]
1002 except ValueError:
979 except ValueError:
1003 # substring '\n' not found, maybe the entry is bigger than the
980 # substring '\n' not found, maybe the entry is bigger than the
1004 # chunksize, so let's keep iterating
981 # chunksize, so let's keep iterating
1005 pass
982 pass
1006
983
1007 if chunk:
984 if chunk:
1008 msg = _(b"fncache does not ends with a newline")
985 msg = _(b"fncache does not ends with a newline")
1009 if warn:
986 if warn:
1010 warn(msg + b'\n')
987 warn(msg + b'\n')
1011 else:
988 else:
1012 raise error.Abort(
989 raise error.Abort(
1013 msg,
990 msg,
1014 hint=_(
991 hint=_(
1015 b"use 'hg debugrebuildfncache' to "
992 b"use 'hg debugrebuildfncache' to "
1016 b"rebuild the fncache"
993 b"rebuild the fncache"
1017 ),
994 ),
1018 )
995 )
1019 self._checkentries(fp, warn)
996 self._checkentries(fp, warn)
1020 fp.close()
997 fp.close()
1021
998
1022 def _checkentries(self, fp, warn):
999 def _checkentries(self, fp, warn):
1023 """make sure there is no empty string in entries"""
1000 """make sure there is no empty string in entries"""
1024 if b'' in self.entries:
1001 if b'' in self.entries:
1025 fp.seek(0)
1002 fp.seek(0)
1026 for n, line in enumerate(fp):
1003 for n, line in enumerate(fp):
1027 if not line.rstrip(b'\n'):
1004 if not line.rstrip(b'\n'):
1028 t = _(b'invalid entry in fncache, line %d') % (n + 1)
1005 t = _(b'invalid entry in fncache, line %d') % (n + 1)
1029 if warn:
1006 if warn:
1030 warn(t + b'\n')
1007 warn(t + b'\n')
1031 else:
1008 else:
1032 raise error.Abort(t)
1009 raise error.Abort(t)
1033
1010
1034 def write(self, tr):
1011 def write(self, tr):
1035 if self._dirty:
1012 if self._dirty:
1036 assert self.entries is not None
1013 assert self.entries is not None
1037 self.entries = self.entries | self.addls
1014 self.entries = self.entries | self.addls
1038 self.addls = set()
1015 self.addls = set()
1039 tr.addbackup(b'fncache')
1016 tr.addbackup(b'fncache')
1040 fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
1017 fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
1041 if self.entries:
1018 if self.entries:
1042 fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
1019 fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
1043 fp.close()
1020 fp.close()
1044 self._dirty = False
1021 self._dirty = False
1045 if self.addls:
1022 if self.addls:
1046 # if we have just new entries, let's append them to the fncache
1023 # if we have just new entries, let's append them to the fncache
1047 tr.addbackup(b'fncache')
1024 tr.addbackup(b'fncache')
1048 fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
1025 fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
1049 if self.addls:
1026 if self.addls:
1050 fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
1027 fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
1051 fp.close()
1028 fp.close()
1052 self.entries = None
1029 self.entries = None
1053 self.addls = set()
1030 self.addls = set()
1054
1031
1055 def addignore(self, fn):
1032 def addignore(self, fn):
1056 self._ignores.add(fn)
1033 self._ignores.add(fn)
1057
1034
1058 def add(self, fn):
1035 def add(self, fn):
1059 if fn in self._ignores:
1036 if fn in self._ignores:
1060 return
1037 return
1061 if self.entries is None:
1038 if self.entries is None:
1062 self._load()
1039 self._load()
1063 if fn not in self.entries:
1040 if fn not in self.entries:
1064 self.addls.add(fn)
1041 self.addls.add(fn)
1065
1042
1066 def remove(self, fn):
1043 def remove(self, fn):
1067 if self.entries is None:
1044 if self.entries is None:
1068 self._load()
1045 self._load()
1069 if fn in self.addls:
1046 if fn in self.addls:
1070 self.addls.remove(fn)
1047 self.addls.remove(fn)
1071 return
1048 return
1072 try:
1049 try:
1073 self.entries.remove(fn)
1050 self.entries.remove(fn)
1074 self._dirty = True
1051 self._dirty = True
1075 except KeyError:
1052 except KeyError:
1076 pass
1053 pass
1077
1054
1078 def __contains__(self, fn):
1055 def __contains__(self, fn):
1079 if fn in self.addls:
1056 if fn in self.addls:
1080 return True
1057 return True
1081 if self.entries is None:
1058 if self.entries is None:
1082 self._load()
1059 self._load()
1083 return fn in self.entries
1060 return fn in self.entries
1084
1061
1085 def __iter__(self):
1062 def __iter__(self):
1086 if self.entries is None:
1063 if self.entries is None:
1087 self._load()
1064 self._load()
1088 return iter(self.entries | self.addls)
1065 return iter(self.entries | self.addls)
1089
1066
1090
1067
1091 class _fncachevfs(vfsmod.proxyvfs):
1068 class _fncachevfs(vfsmod.proxyvfs):
1092 def __init__(self, vfs, fnc, encode):
1069 def __init__(self, vfs, fnc, encode):
1093 vfsmod.proxyvfs.__init__(self, vfs)
1070 vfsmod.proxyvfs.__init__(self, vfs)
1094 self.fncache = fnc
1071 self.fncache = fnc
1095 self.encode = encode
1072 self.encode = encode
1096
1073
1097 def __call__(self, path, mode=b'r', *args, **kw):
1074 def __call__(self, path, mode=b'r', *args, **kw):
1098 encoded = self.encode(path)
1075 encoded = self.encode(path)
1099 if (
1076 if (
1100 mode not in (b'r', b'rb')
1077 mode not in (b'r', b'rb')
1101 and (path.startswith(b'data/') or path.startswith(b'meta/'))
1078 and (path.startswith(b'data/') or path.startswith(b'meta/'))
1102 and is_revlog_file(path)
1079 and is_revlog_file(path)
1103 ):
1080 ):
1104 # do not trigger a fncache load when adding a file that already is
1081 # do not trigger a fncache load when adding a file that already is
1105 # known to exist.
1082 # known to exist.
1106 notload = self.fncache.entries is None and self.vfs.exists(encoded)
1083 notload = self.fncache.entries is None and self.vfs.exists(encoded)
1107 if notload and b'r+' in mode and not self.vfs.stat(encoded).st_size:
1084 if notload and b'r+' in mode and not self.vfs.stat(encoded).st_size:
1108 # when appending to an existing file, if the file has size zero,
1085 # when appending to an existing file, if the file has size zero,
1109 # it should be considered as missing. Such zero-size files are
1086 # it should be considered as missing. Such zero-size files are
1110 # the result of truncation when a transaction is aborted.
1087 # the result of truncation when a transaction is aborted.
1111 notload = False
1088 notload = False
1112 if not notload:
1089 if not notload:
1113 self.fncache.add(path)
1090 self.fncache.add(path)
1114 return self.vfs(encoded, mode, *args, **kw)
1091 return self.vfs(encoded, mode, *args, **kw)
1115
1092
1116 def join(self, path):
1093 def join(self, path):
1117 if path:
1094 if path:
1118 return self.vfs.join(self.encode(path))
1095 return self.vfs.join(self.encode(path))
1119 else:
1096 else:
1120 return self.vfs.join(path)
1097 return self.vfs.join(path)
1121
1098
1122 def register_file(self, path):
1099 def register_file(self, path):
1123 """generic hook point to lets fncache steer its stew"""
1100 """generic hook point to lets fncache steer its stew"""
1124 if path.startswith(b'data/') or path.startswith(b'meta/'):
1101 if path.startswith(b'data/') or path.startswith(b'meta/'):
1125 self.fncache.add(path)
1102 self.fncache.add(path)
1126
1103
1127
1104
1128 class fncachestore(basicstore):
1105 class fncachestore(basicstore):
1129 def __init__(self, path, vfstype, dotencode):
1106 def __init__(self, path, vfstype, dotencode):
1130 if dotencode:
1107 if dotencode:
1131 encode = _pathencode
1108 encode = _pathencode
1132 else:
1109 else:
1133 encode = _plainhybridencode
1110 encode = _plainhybridencode
1134 self.encode = encode
1111 self.encode = encode
1135 vfs = vfstype(path + b'/store')
1112 vfs = vfstype(path + b'/store')
1136 self.path = vfs.base
1113 self.path = vfs.base
1137 self.pathsep = self.path + b'/'
1114 self.pathsep = self.path + b'/'
1138 self.createmode = _calcmode(vfs)
1115 self.createmode = _calcmode(vfs)
1139 vfs.createmode = self.createmode
1116 vfs.createmode = self.createmode
1140 self.rawvfs = vfs
1117 self.rawvfs = vfs
1141 fnc = fncache(vfs)
1118 fnc = fncache(vfs)
1142 self.fncache = fnc
1119 self.fncache = fnc
1143 self.vfs = _fncachevfs(vfs, fnc, encode)
1120 self.vfs = _fncachevfs(vfs, fnc, encode)
1144 self.opener = self.vfs
1121 self.opener = self.vfs
1145
1122
1146 def join(self, f):
1123 def join(self, f):
1147 return self.pathsep + self.encode(f)
1124 return self.pathsep + self.encode(f)
1148
1125
1149 def getsize(self, path):
1126 def getsize(self, path):
1150 return self.rawvfs.stat(path).st_size
1127 return self.rawvfs.stat(path).st_size
1151
1128
1152 def data_entries(
1129 def data_entries(
1153 self, matcher=None, undecodable=None
1130 self, matcher=None, undecodable=None
1154 ) -> Generator[BaseStoreEntry, None, None]:
1131 ) -> Generator[BaseStoreEntry, None, None]:
1155 # Note: all files in fncache should be revlog related, However the
1132 # Note: all files in fncache should be revlog related, However the
1156 # fncache might contains such file added by previous version of
1133 # fncache might contains such file added by previous version of
1157 # Mercurial.
1134 # Mercurial.
1158 files = ((f, None) for f in self.fncache if is_revlog_file(f))
1135 files = ((f, None) for f in self.fncache if is_revlog_file(f))
1159 by_revlog = _gather_revlog(files)
1136 by_revlog = _gather_revlog(files)
1160 for revlog, details in by_revlog:
1137 for revlog, details in by_revlog:
1161 if revlog.startswith(b'data/'):
1138 if revlog.startswith(b'data/'):
1162 rl_type = FILEFLAGS_FILELOG
1139 rl_type = KIND_FILELOG
1163 revlog_target_id = revlog.split(b'/', 1)[1]
1140 revlog_target_id = revlog.split(b'/', 1)[1]
1164 elif revlog.startswith(b'meta/'):
1141 elif revlog.startswith(b'meta/'):
1165 rl_type = FILEFLAGS_MANIFESTLOG
1142 rl_type = KIND_MANIFESTLOG
1166 # drop the initial directory and the `00manifest` file part
1143 # drop the initial directory and the `00manifest` file part
1167 tmp = revlog.split(b'/', 1)[1]
1144 tmp = revlog.split(b'/', 1)[1]
1168 revlog_target_id = tmp.rsplit(b'/', 1)[0] + b'/'
1145 revlog_target_id = tmp.rsplit(b'/', 1)[0] + b'/'
1169 else:
1146 else:
1170 # unreachable
1147 # unreachable
1171 assert False, revlog
1148 assert False, revlog
1172 entry = RevlogStoreEntry(
1149 entry = RevlogStoreEntry(
1173 path_prefix=revlog,
1150 path_prefix=revlog,
1174 revlog_type=rl_type,
1151 revlog_type=rl_type,
1175 target_id=revlog_target_id,
1152 target_id=revlog_target_id,
1176 details=details,
1153 details=details,
1177 )
1154 )
1178 if _match_tracked_entry(entry, matcher):
1155 if _match_tracked_entry(entry, matcher):
1179 yield entry
1156 yield entry
1180
1157
1181 def copylist(self):
1158 def copylist(self):
1182 d = (
1159 d = (
1183 b'bookmarks',
1160 b'bookmarks',
1184 b'narrowspec',
1161 b'narrowspec',
1185 b'data',
1162 b'data',
1186 b'meta',
1163 b'meta',
1187 b'dh',
1164 b'dh',
1188 b'fncache',
1165 b'fncache',
1189 b'phaseroots',
1166 b'phaseroots',
1190 b'obsstore',
1167 b'obsstore',
1191 b'00manifest.d',
1168 b'00manifest.d',
1192 b'00manifest.i',
1169 b'00manifest.i',
1193 b'00changelog.d',
1170 b'00changelog.d',
1194 b'00changelog.i',
1171 b'00changelog.i',
1195 b'requires',
1172 b'requires',
1196 )
1173 )
1197 return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d]
1174 return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d]
1198
1175
1199 def write(self, tr):
1176 def write(self, tr):
1200 self.fncache.write(tr)
1177 self.fncache.write(tr)
1201
1178
1202 def invalidatecaches(self):
1179 def invalidatecaches(self):
1203 self.fncache.entries = None
1180 self.fncache.entries = None
1204 self.fncache.addls = set()
1181 self.fncache.addls = set()
1205
1182
1206 def markremoved(self, fn):
1183 def markremoved(self, fn):
1207 self.fncache.remove(fn)
1184 self.fncache.remove(fn)
1208
1185
1209 def _exists(self, f):
1186 def _exists(self, f):
1210 ef = self.encode(f)
1187 ef = self.encode(f)
1211 try:
1188 try:
1212 self.getsize(ef)
1189 self.getsize(ef)
1213 return True
1190 return True
1214 except FileNotFoundError:
1191 except FileNotFoundError:
1215 return False
1192 return False
1216
1193
1217 def __contains__(self, path):
1194 def __contains__(self, path):
1218 '''Checks if the store contains path'''
1195 '''Checks if the store contains path'''
1219 path = b"/".join((b"data", path))
1196 path = b"/".join((b"data", path))
1220 # check for files (exact match)
1197 # check for files (exact match)
1221 e = path + b'.i'
1198 e = path + b'.i'
1222 if e in self.fncache and self._exists(e):
1199 if e in self.fncache and self._exists(e):
1223 return True
1200 return True
1224 # now check for directories (prefix match)
1201 # now check for directories (prefix match)
1225 if not path.endswith(b'/'):
1202 if not path.endswith(b'/'):
1226 path += b'/'
1203 path += b'/'
1227 for e in self.fncache:
1204 for e in self.fncache:
1228 if e.startswith(path) and self._exists(e):
1205 if e.startswith(path) and self._exists(e):
1229 return True
1206 return True
1230 return False
1207 return False
General Comments 0
You need to be logged in to leave comments. Login now