upstream/mercurial-mirror Commit - r46864:a3ccbac6

1

# manifest.py - manifest revision class for mercurial

1

# manifest.py - manifest revision class for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import heapq

10

import heapq

11

import itertools

11

import itertools

12

import struct

12

import struct

13

import weakref

13

import weakref

14

15

from .i18n import _

15

from .i18n import _

16

from .node import (

16

from .node import (

17

bin,

17

bin,

18

hex,

18

hex,

19

nullid,

19

nullid,

20

nullrev,

20

nullrev,

21

)

21

)

22

from .pycompat import getattr

22

from .pycompat import getattr

23

from . import (

23

from . import (

24

encoding,

24

encoding,

25

error,

25

error,

26

match as matchmod,

26

match as matchmod,

27

mdiff,

27

mdiff,

28

pathutil,

28

pathutil,

29

policy,

29

policy,

30

pycompat,

30

pycompat,

31

revlog,

31

revlog,

32

util,

32

util,

33

)

33

)

34

from .interfaces import (

34

from .interfaces import (

35

repository,

35

repository,

36

util as interfaceutil,

36

util as interfaceutil,

37

)

37

)

38

39

# Resolve the ``parsers`` module through the policy layer; it may or may not
# expose a ``lazymanifest`` implementation (see the fallback further down).
parsers = policy.importmod('parsers')
propertycache = util.propertycache

# Allow tests to more easily test the alternate path in manifestdict.fastdelta()
FASTDELTA_TEXTDIFF_THRESHOLD = 1000

44

45

46

def _parse(data):

46

def _parse(data):

47

# This method does a little bit of excessive-looking

47

# This method does a little bit of excessive-looking

48

# precondition checking. This is so that the behavior of this

48

# precondition checking. This is so that the behavior of this

49

# class exactly matches its C counterpart to try and help

49

# class exactly matches its C counterpart to try and help

50

# prevent surprise breakage for anyone that develops against

50

# prevent surprise breakage for anyone that develops against

51

# the pure version.

51

# the pure version.

52

if data and data[-1:] != b'\n':

52

if data and data[-1:] != b'\n':

53

raise ValueError(b'Manifest did not end in a newline.')

53

raise ValueError(b'Manifest did not end in a newline.')

54

prev = None

54

prev = None

55

for l in data.splitlines():

55

for l in data.splitlines():

56

if prev is not None and prev > l:

56

if prev is not None and prev > l:

57

raise ValueError(b'Manifest lines not in sorted order.')

57

raise ValueError(b'Manifest lines not in sorted order.')

58

prev = l

58

prev = l

59

f, n = l.split(b'\0')

59

f, n = l.split(b'\0')

60

nl = len(n)

60

nl = len(n)

61

flags = n[-1:]

61

flags = n[-1:]

62

if flags in _manifestflags:

62

if flags in _manifestflags:

63

n = n[:-1]

63

n = n[:-1]

64

nl -= 1

64

nl -= 1

65

else:

65

else:

66

flags = b''

66

flags = b''

67

if nl not in (40, 64):

67

if nl not in (40, 64):

68

raise ValueError(b'Invalid manifest line')

68

raise ValueError(b'Invalid manifest line')

69

70

yield f, bin(n), flags

70

yield f, bin(n), flags

71

72

73

def _text(it):
    """Serialize ``(filename, node, flags)`` triples into manifest text.

    Each triple becomes one ``filename\\0hexnode + flags\\n`` line, emitted in
    the order ``it`` produces them.  All filenames are handed to
    ``_checkforbidden`` before the joined byte string is returned.
    """
    files = []
    lines = []
    for f, n, fl in it:
        files.append(f)
        # if this is changed to support newlines in filenames,
        # be sure to check the templates/ dir again (especially *-raw.tmpl)
        lines.append(b"%s\0%s%s\n" % (f, hex(n), fl))

    _checkforbidden(files)
    return b''.join(lines)

84

85

86

class lazymanifestiter(object):
    """Iterator over the filenames of a lazy manifest.

    ``lm`` must provide ``_get(index)`` returning ``(data, pos)``: either the
    backing byte string with the entry's offset, or an
    ``(filename, node, flags)`` tuple with ``pos == -1``.  ``_get`` signals
    the end of the manifest by raising IndexError.
    """

    def __init__(self, lm):
        self.pos = 0
        self.lm = lm

    def __iter__(self):
        return self

    def next(self):
        """Return the next filename, raising StopIteration at the end."""
        try:
            data, pos = self.lm._get(self.pos)
        except IndexError:
            raise StopIteration
        self.pos += 1
        if pos == -1:
            # Entry lives in extradata: ``data`` is the tuple itself.
            return data[0]
        # Entry lives in the byte string: the name ends at the NUL byte.
        zeropos = data.find(b'\x00', pos)
        return data[pos:zeropos]

    __next__ = next

107

108

109

class lazymanifestiterentries(object):
    """Iterator over ``(filename, node, flags)`` entries of a lazy manifest.

    ``lm`` must provide ``_get(index)`` (raising IndexError past the last
    entry) and an ``extrainfo`` list indexed like its entries.
    """

    def __init__(self, lm):
        self.lm = lm
        self.pos = 0

    def __iter__(self):
        return self

    def next(self):
        """Return the next entry, raising StopIteration at the end.

        Raises error.StorageError when a line stored in the byte string has
        no NUL/newline in the expected order or a node of unexpected length.
        """
        try:
            data, pos = self.lm._get(self.pos)
        except IndexError:
            raise StopIteration
        if pos == -1:
            # Entry lives in extradata and is already a complete tuple.
            self.pos += 1
            return data
        zeropos = data.find(b'\x00', pos)
        nlpos = data.find(b'\n', pos)
        if zeropos == -1 or nlpos == -1 or nlpos < zeropos:
            raise error.StorageError(b'Invalid manifest line')
        # The byte right before the newline is a flag only when it is one of
        # the known flag values; otherwise it belongs to the hex node.
        flags = data[nlpos - 1 : nlpos]
        if flags in _manifestflags:
            hlen = nlpos - zeropos - 2
        else:
            hlen = nlpos - zeropos - 1
            flags = b''
        if hlen not in (40, 64):
            raise error.StorageError(b'Invalid manifest line')
        hashval = unhexlify(
            data, self.lm.extrainfo[self.pos], zeropos + 1, hlen
        )
        self.pos += 1
        return (data[pos:zeropos], hashval, flags)

    __next__ = next

144

145

146

def unhexlify(data, extra, pos, length):
    """Decode the hex node stored at ``data[pos:pos + length]``.

    When ``extra`` is non-zero its low 8 bits are appended to the decoded
    node as one additional byte.
    """
    s = bin(data[pos : pos + length])
    if extra:
        # ``chr()`` yields text on Python 3 and cannot be added to bytes;
        # struct.pack produces a single byte on both Python 2 and 3.
        s += struct.pack('>B', extra & 0xFF)
    return s

151

152

153

def _cmp(a, b):

153

def _cmp(a, b):

154

return (a > b) - (a < b)

154

return (a > b) - (a < b)

155

156

157

_manifestflags = {b'', b'l', b't', b'x'}

157

_manifestflags = {b'', b'l', b't', b'x'}

158

159

160

class _lazymanifest(object):

160

class _lazymanifest(object):

161

"""A pure python manifest backed by a byte string. It is supplimented with

161

"""A pure python manifest backed by a byte string. It is supplimented with

162

internal lists as it is modified, until it is compacted back to a pure byte

162

internal lists as it is modified, until it is compacted back to a pure byte

163

string.

163

string.

164

165

``data`` is the initial manifest data.

165

``data`` is the initial manifest data.

166

167

``positions`` is a list of offsets, one per manifest entry. Positive

167

``positions`` is a list of offsets, one per manifest entry. Positive

168

values are offsets into ``data``, negative values are offsets into the

168

values are offsets into ``data``, negative values are offsets into the

169

``extradata`` list. When an entry is removed, its entry is dropped from

169

``extradata`` list. When an entry is removed, its entry is dropped from

170

``positions``. The values are encoded such that when walking the list and

170

``positions``. The values are encoded such that when walking the list and

171

indexing into ``data`` or ``extradata`` as appropriate, the entries are

171

indexing into ``data`` or ``extradata`` as appropriate, the entries are

172

sorted by filename.

172

sorted by filename.

173

174

``extradata`` is a list of (key, hash, flags) for entries that were added or

174

``extradata`` is a list of (key, hash, flags) for entries that were added or

175

modified since the manifest was created or compacted.

175

modified since the manifest was created or compacted.

176

"""

176

"""

177

178

def __init__(

178

def __init__(

179

self,

179

self,

180

data,

180

data,

181

positions=None,

181

positions=None,

182

extrainfo=None,

182

extrainfo=None,

183

extradata=None,

183

extradata=None,

184

hasremovals=False,

184

hasremovals=False,

185

):

185

):

186

if positions is None:

186

if positions is None:

187

self.positions = self.findlines(data)

187

self.positions = self.findlines(data)

188

self.extrainfo = [0] * len(self.positions)

188

self.extrainfo = [0] * len(self.positions)

189

self.data = data

189

self.data = data

190

self.extradata = []

190

self.extradata = []

191

self.hasremovals = False

191

self.hasremovals = False

192

else:

192

else:

193

self.positions = positions[:]

193

self.positions = positions[:]

194

self.extrainfo = extrainfo[:]

194

self.extrainfo = extrainfo[:]

195

self.extradata = extradata[:]

195

self.extradata = extradata[:]

196

self.data = data

196

self.data = data

197

self.hasremovals = hasremovals

197

self.hasremovals = hasremovals

198

199

def findlines(self, data):

199

def findlines(self, data):

200

if not data:

200

if not data:

201

return []

201

return []

202

pos = data.find(b"\n")

202

pos = data.find(b"\n")

203

if pos == -1 or data[-1:] != b'\n':

203

if pos == -1 or data[-1:] != b'\n':

204

raise ValueError(b"Manifest did not end in a newline.")

204

raise ValueError(b"Manifest did not end in a newline.")

205

positions = [0]

205

positions = [0]

206

prev = data[: data.find(b'\x00')]

206

prev = data[: data.find(b'\x00')]

207

while pos < len(data) - 1 and pos != -1:

207

while pos < len(data) - 1 and pos != -1:

208

positions.append(pos + 1)

208

positions.append(pos + 1)

209

nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]

209

nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]

210

if nexts < prev:

210

if nexts < prev:

211

raise ValueError(b"Manifest lines not in sorted order.")

211

raise ValueError(b"Manifest lines not in sorted order.")

212

prev = nexts

212

prev = nexts

213

pos = data.find(b"\n", pos + 1)

213

pos = data.find(b"\n", pos + 1)

214

return positions

214

return positions

215

216

def _get(self, index):

216

def _get(self, index):

217

# get the position encoded in pos:

217

# get the position encoded in pos:

218

# positive number is an index in 'data'

218

# positive number is an index in 'data'

219

# negative number is in extrapieces

219

# negative number is in extrapieces

220

pos = self.positions[index]

220

pos = self.positions[index]

221

if pos >= 0:

221

if pos >= 0:

222

return self.data, pos

222

return self.data, pos

223

return self.extradata[-pos - 1], -1

223

return self.extradata[-pos - 1], -1

224

225

def _getkey(self, pos):

225

def _getkey(self, pos):

226

if pos >= 0:

226

if pos >= 0:

227

return self.data[pos : self.data.find(b'\x00', pos + 1)]

227

return self.data[pos : self.data.find(b'\x00', pos + 1)]

228

return self.extradata[-pos - 1][0]

228

return self.extradata[-pos - 1][0]

229

230

def bsearch(self, key):

230

def bsearch(self, key):

231

first = 0

231

first = 0

232

last = len(self.positions) - 1

232

last = len(self.positions) - 1

233

234

while first <= last:

234

while first <= last:

235

midpoint = (first + last) // 2

235

midpoint = (first + last) // 2

236

nextpos = self.positions[midpoint]

236

nextpos = self.positions[midpoint]

237

candidate = self._getkey(nextpos)

237

candidate = self._getkey(nextpos)

238

r = _cmp(key, candidate)

238

r = _cmp(key, candidate)

239

if r == 0:

239

if r == 0:

240

return midpoint

240

return midpoint

241

else:

241

else:

242

if r < 0:

242

if r < 0:

243

last = midpoint - 1

243

last = midpoint - 1

244

else:

244

else:

245

first = midpoint + 1

245

first = midpoint + 1

246

return -1

246

return -1

247

248

def bsearch2(self, key):

248

def bsearch2(self, key):

249

# same as the above, but will always return the position

249

# same as the above, but will always return the position

250

# done for performance reasons

250

# done for performance reasons

251

first = 0

251

first = 0

252

last = len(self.positions) - 1

252

last = len(self.positions) - 1

253

254

while first <= last:

254

while first <= last:

255

midpoint = (first + last) // 2

255

midpoint = (first + last) // 2

256

nextpos = self.positions[midpoint]

256

nextpos = self.positions[midpoint]

257

candidate = self._getkey(nextpos)

257

candidate = self._getkey(nextpos)

258

r = _cmp(key, candidate)

258

r = _cmp(key, candidate)

259

if r == 0:

259

if r == 0:

260

return (midpoint, True)

260

return (midpoint, True)

261

else:

261

else:

262

if r < 0:

262

if r < 0:

263

last = midpoint - 1

263

last = midpoint - 1

264

else:

264

else:

265

first = midpoint + 1

265

first = midpoint + 1

266

return (first, False)

266

return (first, False)

267

268

def __contains__(self, key):

268

def __contains__(self, key):

269

return self.bsearch(key) != -1

269

return self.bsearch(key) != -1

270

271

def __getitem__(self, key):

271

def __getitem__(self, key):

272

if not isinstance(key, bytes):

272

if not isinstance(key, bytes):

273

raise TypeError(b"getitem: manifest keys must be a bytes.")

273

raise TypeError(b"getitem: manifest keys must be a bytes.")

274

needle = self.bsearch(key)

274

needle = self.bsearch(key)

275

if needle == -1:

275

if needle == -1:

276

raise KeyError

276

raise KeyError

277

data, pos = self._get(needle)

277

data, pos = self._get(needle)

278

if pos == -1:

278

if pos == -1:

279

return (data[1], data[2])

279

return (data[1], data[2])

280

zeropos = data.find(b'\x00', pos)

280

zeropos = data.find(b'\x00', pos)

281

nlpos = data.find(b'\n', zeropos)

281

nlpos = data.find(b'\n', zeropos)

282

assert 0 <= needle <= len(self.positions)

282

assert 0 <= needle <= len(self.positions)

283

assert len(self.extrainfo) == len(self.positions)

283

assert len(self.extrainfo) == len(self.positions)

284

if zeropos == -1 or nlpos == -1 or nlpos < zeropos:

284

if zeropos == -1 or nlpos == -1 or nlpos < zeropos:

285

raise error.StorageError(b'Invalid manifest line')

285

raise error.StorageError(b'Invalid manifest line')

286

hlen = nlpos - zeropos - 1

286

hlen = nlpos - zeropos - 1

287

flags = data[nlpos - 1 : nlpos]

287

flags = data[nlpos - 1 : nlpos]

288

if flags in _manifestflags:

288

if flags in _manifestflags:

289

hlen -= 1

289

hlen -= 1

290

else:

290

else:

291

flags = b''

291

flags = b''

292

if hlen not in (40, 64):

292

if hlen not in (40, 64):

293

raise error.StorageError(b'Invalid manifest line')

293

raise error.StorageError(b'Invalid manifest line')

294

hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)

294

hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)

295

return (hashval, flags)

295

return (hashval, flags)

296

297

def __delitem__(self, key):

297

def __delitem__(self, key):

298

needle, found = self.bsearch2(key)

298

needle, found = self.bsearch2(key)

299

if not found:

299

if not found:

300

raise KeyError

300

raise KeyError

301

cur = self.positions[needle]

301

cur = self.positions[needle]

302

self.positions = self.positions[:needle] + self.positions[needle + 1 :]

302

self.positions = self.positions[:needle] + self.positions[needle + 1 :]

303

self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]

303

self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]

304

if cur >= 0:

304

if cur >= 0:

305

# This does NOT unsort the list as far as the search functions are

305

# This does NOT unsort the list as far as the search functions are

306

# concerned, as they only examine lines mapped by self.positions.

306

# concerned, as they only examine lines mapped by self.positions.

307

self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]

307

self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]

308

self.hasremovals = True

308

self.hasremovals = True

309

310

def __setitem__(self, key, value):

310

def __setitem__(self, key, value):

311

if not isinstance(key, bytes):

311

if not isinstance(key, bytes):

312

raise TypeError(b"setitem: manifest keys must be a byte string.")

312

raise TypeError(b"setitem: manifest keys must be a byte string.")

313

if not isinstance(value, tuple) or len(value) != 2:

313

if not isinstance(value, tuple) or len(value) != 2:

314

raise TypeError(

314

raise TypeError(

315

b"Manifest values must be a tuple of (node, flags)."

315

b"Manifest values must be a tuple of (node, flags)."

316

)

316

)

317

hashval = value[0]

317

hashval = value[0]

318

if not isinstance(hashval, bytes) or len(hashval) not in (20, 32):

318

if not isinstance(hashval, bytes) or len(hashval) not in (20, 32):

319

raise TypeError(b"node must be a 20-byte or 32-byte byte string")

319

raise TypeError(b"node must be a 20-byte or 32-byte byte string")

320

flags = value[1]

320

flags = value[1]

321

if not isinstance(flags, bytes) or len(flags) > 1:

321

if not isinstance(flags, bytes) or len(flags) > 1:

322

raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)

322

raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)

323

needle, found = self.bsearch2(key)

323

needle, found = self.bsearch2(key)

324

if found:

324

if found:

325

# put the item

325

# put the item

326

pos = self.positions[needle]

326

pos = self.positions[needle]

327

if pos < 0:

327

if pos < 0:

328

self.extradata[-pos - 1] = (key, hashval, value[1])

328

self.extradata[-pos - 1] = (key, hashval, value[1])

329

else:

329

else:

330

# just don't bother

330

# just don't bother

331

self.extradata.append((key, hashval, value[1]))

331

self.extradata.append((key, hashval, value[1]))

332

self.positions[needle] = -len(self.extradata)

332

self.positions[needle] = -len(self.extradata)

333

else:

333

else:

334

# not found, put it in with extra positions

334

# not found, put it in with extra positions

335

self.extradata.append((key, hashval, value[1]))

335

self.extradata.append((key, hashval, value[1]))

336

self.positions = (

336

self.positions = (

337

self.positions[:needle]

337

self.positions[:needle]

338

+ [-len(self.extradata)]

338

+ [-len(self.extradata)]

339

+ self.positions[needle:]

339

+ self.positions[needle:]

340

)

340

)

341

self.extrainfo = (

341

self.extrainfo = (

342

self.extrainfo[:needle] + [0] + self.extrainfo[needle:]

342

self.extrainfo[:needle] + [0] + self.extrainfo[needle:]

343

)

343

)

344

345

def copy(self):

345

def copy(self):

346

# XXX call _compact like in C?

346

# XXX call _compact like in C?

347

return _lazymanifest(

347

return _lazymanifest(

348

self.data,

348

self.data,

349

self.positions,

349

self.positions,

350

self.extrainfo,

350

self.extrainfo,

351

self.extradata,

351

self.extradata,

352

self.hasremovals,

352

self.hasremovals,

353

)

353

)

354

355

def _compact(self):

355

def _compact(self):

356

# hopefully not called TOO often

356

# hopefully not called TOO often

357

if len(self.extradata) == 0 and not self.hasremovals:

357

if len(self.extradata) == 0 and not self.hasremovals:

358

return

358

return

359

l = []

359

l = []

360

i = 0

360

i = 0

361

offset = 0

361

offset = 0

362

self.extrainfo = [0] * len(self.positions)

362

self.extrainfo = [0] * len(self.positions)

363

while i < len(self.positions):

363

while i < len(self.positions):

364

if self.positions[i] >= 0:

364

if self.positions[i] >= 0:

365

cur = self.positions[i]

365

cur = self.positions[i]

366

last_cut = cur

366

last_cut = cur

367

368

# Collect all contiguous entries in the buffer at the current

368

# Collect all contiguous entries in the buffer at the current

369

# offset, breaking out only for added/modified items held in

369

# offset, breaking out only for added/modified items held in

370

# extradata, or a deleted line prior to the next position.

370

# extradata, or a deleted line prior to the next position.

371

while True:

371

while True:

372

self.positions[i] = offset

372

self.positions[i] = offset

373

i += 1

373

i += 1

374

if i == len(self.positions) or self.positions[i] < 0:

374

if i == len(self.positions) or self.positions[i] < 0:

375

break

375

break

376

377

# A removed file has no positions[] entry, but does have an

377

# A removed file has no positions[] entry, but does have an

378

# overwritten first byte. Break out and find the end of the

378

# overwritten first byte. Break out and find the end of the

379

# current good entry/entries if there is a removed file

379

# current good entry/entries if there is a removed file

380

# before the next position.

380

# before the next position.

381

if (

381

if (

382

self.hasremovals

382

self.hasremovals

383

and self.data.find(b'\n\x00', cur, self.positions[i])

383

and self.data.find(b'\n\x00', cur, self.positions[i])

384

!= -1

384

!= -1

385

):

385

):

386

break

386

break

387

388

offset += self.positions[i] - cur

388

offset += self.positions[i] - cur

389

cur = self.positions[i]

389

cur = self.positions[i]

390

end_cut = self.data.find(b'\n', cur)

390

end_cut = self.data.find(b'\n', cur)

391

if end_cut != -1:

391

if end_cut != -1:

392

end_cut += 1

392

end_cut += 1

393

offset += end_cut - cur

393

offset += end_cut - cur

394

l.append(self.data[last_cut:end_cut])

394

l.append(self.data[last_cut:end_cut])

395

else:

395

else:

396

while i < len(self.positions) and self.positions[i] < 0:

396

while i < len(self.positions) and self.positions[i] < 0:

397

cur = self.positions[i]

397

cur = self.positions[i]

398

t = self.extradata[-cur - 1]

398

t = self.extradata[-cur - 1]

399

l.append(self._pack(t))

399

l.append(self._pack(t))

400

self.positions[i] = offset

400

self.positions[i] = offset

401

# Hashes are either 20 bytes (old sha1s) or 32

401

# Hashes are either 20 bytes (old sha1s) or 32

402

# bytes (new non-sha1).

402

# bytes (new non-sha1).

403

hlen = 20

403

hlen = 20

404

if len(t[1]) > 25:

404

if len(t[1]) > 25:

405

hlen = 32

405

hlen = 32

406

if len(t[1]) > hlen:

406

if len(t[1]) > hlen:

407

self.extrainfo[i] = ord(t[1][hlen + 1])

407

self.extrainfo[i] = ord(t[1][hlen + 1])

408

offset += len(l[-1])

408

offset += len(l[-1])

409

i += 1

409

i += 1

410

self.data = b''.join(l)

410

self.data = b''.join(l)

411

self.hasremovals = False

411

self.hasremovals = False

412

self.extradata = []

412

self.extradata = []

413

414

def _pack(self, d):

414

def _pack(self, d):

415

n = d[1]

415

n = d[1]

416

assert len(n) in (20, 32)

416

assert len(n) in (20, 32)

417

return d[0] + b'\x00' + hex(n) + d[2] + b'\n'

417

return d[0] + b'\x00' + hex(n) + d[2] + b'\n'

418

419

def text(self):

419

def text(self):

420

self._compact()

420

self._compact()

421

return self.data

421

return self.data

422

423

def diff(self, m2, clean=False):

423

def diff(self, m2, clean=False):

424

'''Finds changes between the current manifest and m2.'''

424

'''Finds changes between the current manifest and m2.'''

425

# XXX think whether efficiency matters here

425

# XXX think whether efficiency matters here

426

diff = {}

426

diff = {}

427

428

for fn, e1, flags in self.iterentries():

428

for fn, e1, flags in self.iterentries():

429

if fn not in m2:

429

if fn not in m2:

430

diff[fn] = (e1, flags), (None, b'')

430

diff[fn] = (e1, flags), (None, b'')

431

else:

431

else:

432

e2 = m2[fn]

432

e2 = m2[fn]

433

if (e1, flags) != e2:

433

if (e1, flags) != e2:

434

diff[fn] = (e1, flags), e2

434

diff[fn] = (e1, flags), e2

435

elif clean:

435

elif clean:

436

diff[fn] = None

436

diff[fn] = None

437

438

for fn, e2, flags in m2.iterentries():

438

for fn, e2, flags in m2.iterentries():

439

if fn not in self:

439

if fn not in self:

440

diff[fn] = (None, b''), (e2, flags)

440

diff[fn] = (None, b''), (e2, flags)

441

442

return diff

442

return diff

443

444

def iterentries(self):

444

def iterentries(self):

445

return lazymanifestiterentries(self)

445

return lazymanifestiterentries(self)

446

447

def iterkeys(self):

447

def iterkeys(self):

448

return lazymanifestiter(self)

448

return lazymanifestiter(self)

449

450

def __iter__(self):

450

def __iter__(self):

451

return lazymanifestiter(self)

451

return lazymanifestiter(self)

452

453

def __len__(self):

453

def __len__(self):

454

return len(self.positions)

454

return len(self.positions)

455

456

def filtercopy(self, filterfn):

456

def filtercopy(self, filterfn):

457

# XXX should be optimized

457

# XXX should be optimized

458

c = _lazymanifest(b'')

458

c = _lazymanifest(b'')

459

for f, n, fl in self.iterentries():

459

for f, n, fl in self.iterentries():

460

if filterfn(f):

460

if filterfn(f):

461

c[f] = n, fl

461

c[f] = n, fl

462

return c

462

return c

463

464

465

# Use the lazymanifest implementation exposed by the ``parsers`` module when
# it has one; otherwise keep the Python ``_lazymanifest`` class defined in
# this module.
try:
    _lazymanifest = parsers.lazymanifest
except AttributeError:
    pass

469

470

471

@interfaceutil.implementer(repository.imanifestdict)

471

@interfaceutil.implementer(repository.imanifestdict)

472

class manifestdict(object):

472

class manifestdict(object):

473

def __init__(self, data=b''):

473

def __init__(self, data=b''):

474

self._lm = _lazymanifest(data)

474

self._lm = _lazymanifest(data)

475

476

def __getitem__(self, key):

476

def __getitem__(self, key):

477

return self._lm[key][0]

477

return self._lm[key][0]

478

479

def find(self, key):

479

def find(self, key):

480

return self._lm[key]

480

return self._lm[key]

481

482

def __len__(self):

482

def __len__(self):

483

return len(self._lm)

483

return len(self._lm)

484

485

def __nonzero__(self):

485

def __nonzero__(self):

486

# nonzero is covered by the __len__ function, but implementing it here

486

# nonzero is covered by the __len__ function, but implementing it here

487

# makes it easier for extensions to override.

487

# makes it easier for extensions to override.

488

return len(self._lm) != 0

488

return len(self._lm) != 0

489

490

__bool__ = __nonzero__

490

__bool__ = __nonzero__

491

492

def __setitem__(self, key, node):

492

def __setitem__(self, key, node):

493

self._lm[key] = node, self.flags(key)

493

self._lm[key] = node, self.flags(key)

494

495

def __contains__(self, key):

495

def __contains__(self, key):

496

if key is None:

496

if key is None:

497

return False

497

return False

498

return key in self._lm

498

return key in self._lm

499

500

def __delitem__(self, key):

500

def __delitem__(self, key):

501

del self._lm[key]

501

del self._lm[key]

502

503

def __iter__(self):

503

def __iter__(self):

504

return self._lm.__iter__()

504

return self._lm.__iter__()

505

506

def iterkeys(self):

506

def iterkeys(self):

507

return self._lm.iterkeys()

507

return self._lm.iterkeys()

508

509

def keys(self):

509

def keys(self):

510

return list(self.iterkeys())

510

return list(self.iterkeys())

511

512

def filesnotin(self, m2, match=None):

512

def filesnotin(self, m2, match=None):

513

'''Set of files in this manifest that are not in the other'''

513

'''Set of files in this manifest that are not in the other'''

514

if match is not None:

514

if match is not None:

515

match = matchmod.badmatch(match, lambda path, msg: None)

515

match = matchmod.badmatch(match, lambda path, msg: None)

516

sm2 = set(m2.walk(match))

516

sm2 = set(m2.walk(match))

517

return {f for f in self.walk(match) if f not in sm2}

517

return {f for f in self.walk(match) if f not in sm2}

518

return {f for f in self if f not in m2}

518

return {f for f in self if f not in m2}

519

520

@propertycache

520

@propertycache

521

def _dirs(self):

521

def _dirs(self):

522

return pathutil.dirs(self)

522

return pathutil.dirs(self)

523

524

def dirs(self):

524

def dirs(self):

525

return self._dirs

525

return self._dirs

526

527

def hasdir(self, dir):

527

def hasdir(self, dir):

528

return dir in self._dirs

528

return dir in self._dirs

529

530

def _filesfastpath(self, match):

530

def _filesfastpath(self, match):

531

"""Checks whether we can correctly and quickly iterate over matcher

531

"""Checks whether we can correctly and quickly iterate over matcher

532

files instead of over manifest files."""

532

files instead of over manifest files."""

533

files = match.files()

533

files = match.files()

534

return len(files) < 100 and (

534

return len(files) < 100 and (

535

match.isexact()

535

match.isexact()

536

or (match.prefix() and all(fn in self for fn in files))

536

or (match.prefix() and all(fn in self for fn in files))

537

)

537

)

538

539

def walk(self, match):

539

def walk(self, match):

540

"""Generates matching file names.

540

"""Generates matching file names.

541

542

Equivalent to manifest.matches(match).iterkeys(), but without creating

542

Equivalent to manifest.matches(match).iterkeys(), but without creating

543

an entirely new manifest.

543

an entirely new manifest.

544

545

It also reports nonexistent files by marking them bad with match.bad().

545

It also reports nonexistent files by marking them bad with match.bad().

546

"""

546

"""

547

if match.always():

547

if match.always():

548

for f in iter(self):

548

for f in iter(self):

549

yield f

549

yield f

550

return

550

return

551

552

fset = set(match.files())

552

fset = set(match.files())

553

554

# avoid the entire walk if we're only looking for specific files

554

# avoid the entire walk if we're only looking for specific files

555

if self._filesfastpath(match):

555

if self._filesfastpath(match):

556

for fn in sorted(fset):

556

for fn in sorted(fset):

557

if fn in self:

557

if fn in self:

558

yield fn

558

yield fn

559

return

559

return

560

561

for fn in self:

561

for fn in self:

562

if fn in fset:

562

if fn in fset:

563

# specified pattern is the exact name

563

# specified pattern is the exact name

564

fset.remove(fn)

564

fset.remove(fn)

565

if match(fn):

565

if match(fn):

566

yield fn

566

yield fn

567

568

# for dirstate.walk, files=[''] means "walk the whole tree".

568

# for dirstate.walk, files=[''] means "walk the whole tree".

569

# follow that here, too

569

# follow that here, too

570

fset.discard(b'')

570

fset.discard(b'')

571

572

for fn in sorted(fset):

572

for fn in sorted(fset):

573

if not self.hasdir(fn):

573

if not self.hasdir(fn):

574

match.bad(fn, None)

574

match.bad(fn, None)

575

576

def _matches(self, match):
    """Return a new manifest holding only the entries ``match`` selects."""
    if match.always():
        return self.copy()

    filtered = manifestdict()
    if not self._filesfastpath(match):
        # general case: let the lazy manifest filter itself
        filtered._lm = self._lm.filtercopy(match)
        return filtered

    # Only explicit files were requested: copy those entries one by one.
    source = self._lm
    for name in match.files():
        if name in source:
            filtered._lm[name] = source[name]
    return filtered

592

593

def diff(self, m2, match=None, clean=False):
    """Finds changes between the current manifest and m2.

    Args:
      m2: the manifest to which this manifest should be compared.
      match: optional matcher; when given, both manifests are filtered
        through it before being compared.
      clean: if true, include files unchanged between these manifests
        with a None value in the returned dictionary.

    The result is returned as a dict with filename as key and
    values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
    nodeid in the current/other manifest and fl1/fl2 is the flag
    in the current/other manifest. Where the file does not exist,
    the nodeid will be None and the flags will be the empty
    string.
    """
    if not match:
        return self._lm.diff(m2._lm, clean)
    left = self._matches(match)
    right = m2._matches(match)
    return left.diff(right, clean=clean)

613

614

def setflag(self, key, flag):
    """Replace the flag stored for ``key``, keeping its current node.

    Raises TypeError when ``flag`` is not one of ``_manifestflags``.
    """
    if flag not in _manifestflags:
        raise TypeError(b"Invalid manifest flag set.")
    node = self[key]
    self._lm[key] = node, flag

618

619

def get(self, key, default=None):
    """Return the node stored for ``key``, or ``default`` if it is absent."""
    try:
        entry = self._lm[key]
    except KeyError:
        return default
    return entry[0]

624

625

def flags(self, key):
    """Return the flags stored for ``key``, or ``b''`` if it is absent."""
    try:
        entry = self._lm[key]
    except KeyError:
        return b''
    return entry[1]

630

631

def copy(self):
    """Return a new manifestdict backed by a copy of this one's ``_lm``."""
    duplicate = manifestdict()
    duplicate._lm = self._lm.copy()
    return duplicate

635

636

def items(self):
    """Return a generator over the first two fields of each entry."""
    entries = self._lm.iterentries()
    return (entry[:2] for entry in entries)

638

639

def iteritems(self):
    """Return a generator over the first two fields of each entry."""
    entries = self._lm.iterentries()
    return (entry[:2] for entry in entries)

641

642

def iterentries(self):
    """Return the entry iterator of the underlying ``_lm`` object."""
    entries = self._lm.iterentries()
    return entries

644

645

def text(self):
    """Return the manifest text as produced by the underlying ``_lm``."""
    # most likely uses native version
    rendered = self._lm.text()
    return rendered

648

649

def fastdelta(self, base, changes):
    """Given a base manifest text as a bytearray and a list of changes
    relative to that text, compute a delta that can be used by revlog.

    ``changes`` is consumed as ``(filename, todelete)`` pairs.  For an
    entry that is not deleted, the new line is built from this manifest's
    own node and flags for that filename.

    Returns ``(arraytext, deltatext)``: the new full text as a bytearray
    and the delta against ``base``.

    Raises AssertionError when a file marked for deletion is not present
    in ``base``.
    """
    delta = []
    # [dstart, dend) is the span of base covered by the hunk currently
    # being accumulated; dline collects that hunk's replacement lines.
    dstart = None
    dend = None
    dline = [b""]
    start = 0
    # zero copy representation of base as a buffer
    addbuf = util.buffer(base)

    changes = list(changes)
    if len(changes) < FASTDELTA_TEXTDIFF_THRESHOLD:
        # start with a readonly loop that finds the offset of
        # each line and creates the deltas
        for f, todelete in changes:
            # (start, end) is either the span of f's existing line or,
            # when start == end, the insertion point for f.  The previous
            # start is passed as the lower search bound.
            # NOTE(review): this presumably requires changes to be sorted
            # by filename -- confirm against callers.
            start, end = _msearch(addbuf, f, start)
            if not todelete:
                h, fl = self._lm[f]
                l = b"%s\0%s%s\n" % (f, hex(h), fl)
            else:
                if start == end:
                    # item we want to delete was not found, error out
                    raise AssertionError(
                        _(b"failed to remove %s from manifest") % f
                    )
                l = b""
            if dstart is not None and dstart <= start and dend >= start:
                # this change touches or overlaps the current hunk:
                # extend the hunk instead of starting a new one
                if dend < end:
                    dend = end
                if l:
                    dline.append(l)
            else:
                # flush the finished hunk (if any) and start a new one
                if dstart is not None:
                    delta.append([dstart, dend, b"".join(dline)])
                dstart = start
                dend = end
                dline = [l]

        # flush the last pending hunk
        if dstart is not None:
            delta.append([dstart, dend, b"".join(dline)])
        # apply the delta to the base, and get a delta for addrevision
        deltatext, arraytext = _addlistdelta(base, delta)
    else:
        # For large changes, it's much cheaper to just build the text and
        # diff it.
        arraytext = bytearray(self.text())
        deltatext = mdiff.textdiff(
            util.buffer(base), util.buffer(arraytext)
        )

    return arraytext, deltatext

703

704

705

def _msearch(m, s, lo=0, hi=None):
    """return a tuple (start, end) that says where to find s within m.

    If the string is found m[start:end] are the line containing
    that string.  If start == end the string was not found and
    they indicate the proper sorted insertion point.

    m should be a buffer, a memoryview or a byte string.
    s is a byte string

    lo and hi bound the bisection in the same way as in the bisect
    module; hi defaults to len(m) only when it is not given, so an
    explicit hi=0 is honoured as an empty search range."""

    def advance(i, c):
        # move i forward to the next occurrence of byte c (or to len(m))
        while i < lenm and m[i : i + 1] != c:
            i += 1
        return i

    if not s:
        return (lo, lo)
    lenm = len(m)
    if hi is None:
        hi = lenm
    while lo < hi:
        mid = (lo + hi) // 2
        # back up to the beginning of the line containing mid
        start = mid
        while start > 0 and m[start - 1 : start] != b'\n':
            start -= 1
        # the filename runs up to the NUL separator
        end = advance(start, b'\0')
        # bytes() is needed because memoryview slices are not orderable
        if bytes(m[start:end]) < s:
            # we know that after the null there are 40 bytes of sha1
            # this translates to the bisect lo = mid + 1
            lo = advance(end + 40, b'\n') + 1
        else:
            # this translates to the bisect hi = mid
            hi = start
    end = advance(lo, b'\0')
    found = m[lo:end]
    if s == found:
        # we know that after the null there are 40 bytes of sha1
        end = advance(end + 40, b'\n')
        return (lo, end + 1)
    else:
        return (lo, lo)

746

747

748

def _checkforbidden(l):
    """Check filenames for illegal characters.

    Raises error.StorageError on the first name containing a newline or
    a carriage return.
    """
    for name in l:
        if b'\n' not in name and b'\r' not in name:
            continue
        raise error.StorageError(
            _(b"'\\n' and '\\r' disallowed in filenames: %r")
            % pycompat.bytestr(name)
        )

756

757

758

# apply the changes collected during the bisect loop to our addlist

758

# apply the changes collected during the bisect loop to our addlist

759

# return a delta suitable for addrevision

759

# return a delta suitable for addrevision

760

def _addlistdelta(addlist, x):
    """Apply the hunks in ``x`` to ``addlist`` and encode them as a delta.

    ``x`` is a sequence of ``(start, end, content)`` hunks, each replacing
    ``addlist[start:end]`` with ``content``.  Returns
    ``(deltatext, newaddlist)``.
    """
    # for large addlist arrays, building a new array is cheaper
    # than repeatedly modifying the existing one
    rebuilt = bytearray()
    cursor = 0
    for begin, stop, payload in x:
        # copy the untouched region before this hunk, then its payload
        rebuilt += addlist[cursor:begin]
        if payload:
            rebuilt += bytearray(payload)
        cursor = stop
    rebuilt += addlist[cursor:]

    pieces = []
    for begin, stop, payload in x:
        header = struct.pack(b">lll", begin, stop, len(payload))
        pieces.append(header + payload)
    deltatext = b"".join(pieces)
    return deltatext, rebuilt

780

781

782

def _splittopdir(f):
    """Split ``f`` into its first directory (with trailing '/') and the rest.

    Returns ``(b'', f)`` when ``f`` contains no slash.
    """
    head, sep, tail = f.partition(b'/')
    if not sep:
        return b'', f
    return head + b'/', tail

788

789

790

def _noop(s):
    """Accept one argument and do nothing.

    treemanifest stores this as the placeholder for its ``_loadfunc`` and
    ``_copyfunc`` hooks and compares against it by identity.
    """
    return None

791

792

793

@interfaceutil.implementer(repository.imanifestdict)

793

@interfaceutil.implementer(repository.imanifestdict)

794

class treemanifest(object):

794

class treemanifest(object):

795

def __init__(self, dir=b'', text=b''):
    """Create a tree manifest for directory ``dir``.

    When ``text`` is non-empty it is parsed as a flat manifest and the
    instance is marked dirty.
    """
    self._dir = dir
    self._node = nullid
    self._loadfunc = _noop
    self._copyfunc = _noop
    self._dirty = False
    self._dirs = {}
    self._lazydirs = {}
    # Using _lazymanifest here is a little slower than plain old dicts
    self._files = {}
    self._flags = {}
    if not text:
        return

    def rejectsubtree(subdir, subm):
        raise AssertionError(
            b'treemanifest constructor only accepts flat manifests'
        )

    self.parse(text, rejectsubtree)
    self._dirty = True  # Mark flat manifest dirty after parsing

815

816

def _subpath(self, path):
    """Return ``path`` prefixed with this tree's directory."""
    prefix = self._dir
    return prefix + path

818

819

def _loadalllazy(self):
    """Materialise every entry of ``_lazydirs`` into ``_dirs``."""
    loaded = self._dirs
    fullpath = self._subpath
    for name, entry in pycompat.iteritems(self._lazydirs):
        node, reader, wantcopy = entry
        subtree = reader(fullpath(name), node)
        # entries flagged for copying must not share the reader's object
        loaded[name] = subtree.copy() if wantcopy else subtree
    self._lazydirs = {}

830

831

def _loadlazy(self, d):
    """Materialise the lazy directory ``d`` into ``_dirs``, if pending."""
    entry = self._lazydirs.get(d)
    if not entry:
        return
    node, reader, wantcopy = entry
    subtree = reader(self._subpath(d), node)
    if wantcopy:
        subtree = subtree.copy()
    self._dirs[d] = subtree
    del self._lazydirs[d]

840

841

def _loadchildrensetlazy(self, visit):
    """Load the lazy directories named by ``visit``.

    A falsy ``visit`` loads nothing; ``b'all'`` or ``b'this'`` loads
    every lazy directory.  In both cases None is returned.  Otherwise
    each element of ``visit`` (with a trailing '/') is loaded and
    ``visit`` itself is returned.
    """
    if not visit:
        return None
    if visit in (b'all', b'this'):
        self._loadalllazy()
        return None

    load = self._loadlazy
    for child in visit:
        load(child + b'/')
    return visit

852

853

def _loaddifflazy(self, t1, t2):
    """load items in t1 and t2 if they're needed for diffing.

    The criteria currently is:
    - if it's not present in _lazydirs in either t1 or t2, load it in the
      other (it may already be loaded or it may not exist, doesn't matter)
    - if it's present in _lazydirs in both, compare the nodeid; if it
      differs, load it in both
    """
    pending = []
    for name, entry1 in pycompat.iteritems(t1._lazydirs):
        entry2 = t2._lazydirs.get(name)
        if entry2 and entry2[0] == entry1[0]:
            # lazy on both sides with the same node: nothing to diff
            continue
        pending.append(name)
    for name, _entry in pycompat.iteritems(t2._lazydirs):
        if name not in t1._lazydirs:
            pending.append(name)

    for name in pending:
        t1._loadlazy(name)
        t2._loadlazy(name)

874

875

def __len__(self):
    """Return the number of files in this tree, including all subtrees."""
    self._load()
    count = len(self._files)
    self._loadalllazy()
    return count + sum(sub.__len__() for sub in self._dirs.values())

882

883

def __nonzero__(self):
    """Return True when this tree is not empty."""
    # Faster than "__len() != 0" since it avoids loading sub-manifests
    empty = self._isempty()
    return not empty

__bool__ = __nonzero__

888

889

def _isempty(self):
    """Return True when neither this tree nor any subtree holds a file."""
    self._load()  # for consistency; already loaded by all callers
    # See if we can skip loading everything.
    if self._files:
        return False
    if any(not sub._isempty() for sub in self._dirs.values()):
        return False
    # Nothing found so far: the lazy directories have to be checked too.
    self._loadalllazy()
    for sub in self._dirs.values():
        if not sub._isempty():
            return False
    return True

898

899

@encoding.strmethod
def __repr__(self):
    """Describe the tree by directory, node, loaded/dirty state and id."""
    fields = (
        self._dir,
        hex(self._node),
        bool(self._loadfunc is _noop),
        self._dirty,
        id(self),
    )
    template = b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
    return template % fields

911

912

def dir(self):
    """Return the directory this tree manifest represents.

    The value includes a trailing '/'; it is the empty string for the
    repo root directory.
    """
    path = self._dir
    return path

916

917

def node(self):
    """Return the node of this instance (nullid for unsaved instances).

    The node should be updated when the instance is read or written from
    a revlog.  Asserts that the instance is not dirty.
    """
    assert not self._dirty
    current = self._node
    return current

923

924

def setnode(self, node):
    """Record ``node`` as this instance's node and clear the dirty flag."""
    self._dirty = False
    self._node = node

927

928

def iterentries(self):
    """Yield ``(path, node, flags)`` for every file, in sorted key order.

    Subdirectories are expanded in place by delegating to their own
    ``iterentries``.
    """
    self._load()
    self._loadalllazy()
    combined = itertools.chain(self._dirs.items(), self._files.items())
    for key, value in sorted(combined):
        if key not in self._files:
            # a subtree: emit its entries as-is
            for entry in value.iterentries():
                yield entry
            continue
        yield self._subpath(key), value, self._flags.get(key, b'')

939

940

def items(self):
    """Yield ``(path, node)`` for every file, in sorted key order.

    Subdirectories are expanded in place by iterating their items.
    """
    self._load()
    self._loadalllazy()
    combined = itertools.chain(self._dirs.items(), self._files.items())
    for key, value in sorted(combined):
        if key not in self._files:
            # a subtree: emit its items as-is
            for path, subnode in pycompat.iteritems(value):
                yield path, subnode
            continue
        yield self._subpath(key), value

iteritems = items

953

954

def iterkeys(self):
    """Yield the path of every file, in sorted key order.

    Subdirectories are expanded in place by iterating the subtree.
    """
    self._load()
    self._loadalllazy()
    for key in sorted(itertools.chain(self._dirs, self._files)):
        if key not in self._files:
            for path in self._dirs[key]:
                yield path
            continue
        yield self._subpath(key)

963

964

def keys(self):
    """Return a list of everything ``iterkeys()`` yields."""
    names = self.iterkeys()
    return list(names)

966

967

def __iter__(self):
    """Iterate over file paths; same as ``iterkeys()``."""
    names = self.iterkeys()
    return names

969

970

def __contains__(self, f):
    """Return True when file ``f`` is in this tree; None is never in it."""
    if f is None:
        return False
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        return f in self._files

    # descend into the first path component, loading it if it is lazy
    self._loadlazy(topdir)
    if topdir not in self._dirs:
        return False
    return self._dirs[topdir].__contains__(rest)

984

985

def get(self, f, default=None):
    """Return the node of file ``f``, or ``default`` when it is absent."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        return self._files.get(f, default)

    # descend into the first path component, loading it if it is lazy
    self._loadlazy(topdir)
    if topdir in self._dirs:
        return self._dirs[topdir].get(rest, default)
    return default

996

997

def __getitem__(self, f):
    """Return the node of file ``f``; a missing entry raises KeyError."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        return self._files[f]

    # descend into the first path component, loading it if it is lazy
    self._loadlazy(topdir)
    subtree = self._dirs[topdir]
    return subtree.__getitem__(rest)

1006

1007

def flags(self, f):
    """Return the flags of file ``f``, or ``b''`` when none are recorded."""
    self._load()
    topdir, rest = _splittopdir(f)
    if topdir:
        # descend into the first path component, loading it if it is lazy
        self._loadlazy(topdir)
        if topdir in self._dirs:
            return self._dirs[topdir].flags(rest)
        return b''

    if f in self._lazydirs or f in self._dirs:
        return b''
    return self._flags.get(f, b'')

1020

1021

def find(self, f):
    """Return ``(node, flags)`` for file ``f``; missing raises KeyError."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        node = self._files[f]
        return node, self._flags.get(f, b'')

    # descend into the first path component, loading it if it is lazy
    self._loadlazy(topdir)
    subtree = self._dirs[topdir]
    return subtree.find(rest)

1030

1031

def __delitem__(self, f):
    """Remove file ``f`` (and its flags) and mark this tree dirty.

    A subdirectory left empty by the removal is dropped as well.
    """
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        del self._files[f]
        self._flags.pop(f, None)
    else:
        self._loadlazy(topdir)
        self._dirs[topdir].__delitem__(rest)
        # If the directory is now empty, remove it
        if self._dirs[topdir]._isempty():
            del self._dirs[topdir]
    self._dirty = True

1046

1047

def __setitem__(self, f, n):
    """Store node ``n`` for file ``f`` and mark this tree dirty.

    Intermediate subtrees are created on demand.
    """
    assert n is not None
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        # manifest nodes are either 20 bytes or 32 bytes,
        # depending on the hash in use. Assert this as historically
        # sometimes extra bytes were added.
        assert len(n) in (20, 32)
        self._files[f] = n
    else:
        self._loadlazy(topdir)
        if topdir not in self._dirs:
            self._dirs[topdir] = treemanifest(self._subpath(topdir))
        self._dirs[topdir].__setitem__(rest, n)
    self._dirty = True

1063

1064

def _load(self):
    """Run the pending load hook, or else the pending copy hook.

    The hook is reset to ``_noop`` before it is called, so each hook runs
    at most once.
    """
    if self._loadfunc is not _noop:
        pending = self._loadfunc
        self._loadfunc = _noop
        pending(self)
        return
    if self._copyfunc is not _noop:
        pending = self._copyfunc
        self._copyfunc = _noop
        pending(self)

1071

1072

def setflag(self, f, flags):
    """Set the flags (symlink, executable) for path f.

    Raises TypeError when ``flags`` is not one of ``_manifestflags``.
    Marks this tree dirty.
    """
    if flags not in _manifestflags:
        raise TypeError(b"Invalid manifest flag set.")
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        self._flags[f] = flags
    else:
        self._loadlazy(topdir)
        if topdir not in self._dirs:
            self._dirs[topdir] = treemanifest(self._subpath(topdir))
        self._dirs[topdir].setflag(rest, flags)
    self._dirty = True

1086

1087

def copy(self):
    """Return a copy of this tree.

    When this tree still has a pending load hook, the actual copying is
    deferred: it is installed as the copy's ``_copyfunc``.
    """
    duplicate = treemanifest(self._dir)
    duplicate._node = self._node
    duplicate._dirty = self._dirty

    if self._copyfunc is not _noop:
        # this tree is itself an unresolved copy: share its hook
        duplicate._copyfunc = self._copyfunc
        return duplicate

    def _copyfunc(s):
        self._load()
        # lazy entries are re-registered with the copy flag set
        s._lazydirs = {
            name: (node, reader, True)
            for name, (node, reader, _c) in pycompat.iteritems(self._lazydirs)
        }
        target = s._dirs
        for name, subtree in pycompat.iteritems(self._dirs):
            target[name] = subtree.copy()
        s._files = dict.copy(self._files)
        s._flags = dict.copy(self._flags)

    if self._loadfunc is _noop:
        _copyfunc(duplicate)
    else:
        duplicate._copyfunc = _copyfunc
    return duplicate

1112

1113

def filesnotin(self, m2, match=None):
    """Set of files in this manifest that are not in the other"""
    if match and not match.always():
        filtered1 = self._matches(match)
        filtered2 = m2._matches(match)
        return filtered1.filesnotin(filtered2)

    missing = set()

    def compare(left, right):
        # identical, unmodified subtrees cannot differ
        if left._node == right._node and not (left._dirty or right._dirty):
            return
        left._load()
        right._load()
        self._loaddifflazy(left, right)
        for name, sub in pycompat.iteritems(left._dirs):
            if name not in right._dirs:
                # whole directory is absent on the other side
                missing.update(sub.iterkeys())
                continue
            compare(sub, right._dirs[name])

        for fn in left._files:
            if fn not in right._files:
                missing.add(left._subpath(fn))

    compare(self, m2)
    return missing

1141

1142

@propertycache
def _alldirs(self):
    """Return ``pathutil.dirs`` built from this manifest."""
    alldirs = pathutil.dirs(self)
    return alldirs

1145

1146

def dirs(self):
    """Return the ``_alldirs`` object for this manifest."""
    alldirs = self._alldirs
    return alldirs

1148

1149

def hasdir(self, dir):
    """Return whether ``dir`` names a directory known to this manifest.

    The path is split with ``_splittopdir``; when it has a leading
    component the question is forwarded to that child tree, otherwise the
    name (with a trailing slash) is looked up among the loaded and lazy
    subdirectories.
    """
    self._load()
    head, rest = _splittopdir(dir)
    if not head:
        # Subdirectory keys carry a trailing slash.
        key = dir + b'/'
        if key in self._dirs:
            return True
        return key in self._lazydirs
    self._loadlazy(head)
    if head not in self._dirs:
        return False
    return self._dirs[head].hasdir(rest)

1159

1160

def walk(self, match):
    """Generate the names of the files selected by ``match``.

    Explicitly requested paths that turn out to be neither a yielded file
    nor a directory of this manifest are reported through ``match.bad()``.
    """
    if match.always():
        for name in iter(self):
            yield name
        return

    pending = set(match.files())

    for name in self._walk(match):
        # an exact name given to the matcher has now been accounted for
        pending.discard(name)
        yield name

    # for dirstate.walk, files=[''] means "walk the whole tree".
    # follow that here, too
    pending.discard(b'')

    for name in sorted(pending):
        if self.hasdir(name):
            continue
        match.bad(name, None)

1185

1186

def _walk(self, match):

1186

def _walk(self, match):

1187

'''Recursively generates matching file names for walk().'''

1187

'''Recursively generates matching file names for walk().'''

1188

visit = match.visitchildrenset(self._dir[:-1])

1188

visit = match.visitchildrenset(self._dir[:-1])

1189

if not visit:

1189

if not visit:

1190

return

1190

return

1191

1192

# yield this dir's files and walk its submanifests

1192

# yield this dir's files and walk its submanifests

1193

self._load()

1193

self._load()

1194

visit = self._loadchildrensetlazy(visit)

1194

visit = self._loadchildrensetlazy(visit)

1195

for p in sorted(list(self._dirs) + list(self._files)):

1195

for p in sorted(list(self._dirs) + list(self._files)):

1196

if p in self._files:

1196

if p in self._files:

1197

fullp = self._subpath(p)

1197

fullp = self._subpath(p)

1198

if match(fullp):

1198

if match(fullp):

1199

yield fullp

1199

yield fullp

1200

else:

1200

else:

1201

if not visit or p[:-1] in visit:

1201

if not visit or p[:-1] in visit:

1202

for f in self._dirs[p]._walk(match):

1202

for f in self._dirs[p]._walk(match):

1203

yield f

1203

yield f

1204

1205

def _matches(self, match):

1205

def _matches(self, match):

1206

"""recursively generate a new manifest filtered by the match argument."""

1206

"""recursively generate a new manifest filtered by the match argument."""

1207

if match.always():

1207

if match.always():

1208

return self.copy()

1208

return self.copy()

1209

return self._matches_inner(match)

1209

return self._matches_inner(match)

1210

1211

def _matches_inner(self, match):

1211

def _matches_inner(self, match):

1212

if match.always():

1212

if match.always():

1213

return self.copy()

1213

return self.copy()

1214

1215

visit = match.visitchildrenset(self._dir[:-1])

1215

visit = match.visitchildrenset(self._dir[:-1])

1216

if visit == b'all':

1216

if visit == b'all':

1217

return self.copy()

1217

return self.copy()

1218

ret = treemanifest(self._dir)

1218

ret = treemanifest(self._dir)

1219

if not visit:

1219

if not visit:

1220

return ret

1220

return ret

1221

1222

self._load()

1222

self._load()

1223

for fn in self._files:

1223

for fn in self._files:

1224

# While visitchildrenset *usually* lists only subdirs, this is

1224

# While visitchildrenset *usually* lists only subdirs, this is

1225

# actually up to the matcher and may have some files in the set().

1225

# actually up to the matcher and may have some files in the set().

1226

# If visit == 'this', we should obviously look at the files in this

1226

# If visit == 'this', we should obviously look at the files in this

1227

# directory; if visit is a set, and fn is in it, we should inspect

1227

# directory; if visit is a set, and fn is in it, we should inspect

1228

# fn (but no need to inspect things not in the set).

1228

# fn (but no need to inspect things not in the set).

1229

if visit != b'this' and fn not in visit:

1229

if visit != b'this' and fn not in visit:

1230

continue

1230

continue

1231

fullp = self._subpath(fn)

1231

fullp = self._subpath(fn)

1232

# visitchildrenset isn't perfect, we still need to call the regular

1232

# visitchildrenset isn't perfect, we still need to call the regular

1233

# matcher code to further filter results.

1233

# matcher code to further filter results.

1234

if not match(fullp):

1234

if not match(fullp):

1235

continue

1235

continue

1236

ret._files[fn] = self._files[fn]

1236

ret._files[fn] = self._files[fn]

1237

if fn in self._flags:

1237

if fn in self._flags:

1238

ret._flags[fn] = self._flags[fn]

1238

ret._flags[fn] = self._flags[fn]

1239

1240

visit = self._loadchildrensetlazy(visit)

1240

visit = self._loadchildrensetlazy(visit)

1241

for dir, subm in pycompat.iteritems(self._dirs):

1241

for dir, subm in pycompat.iteritems(self._dirs):

1242

if visit and dir[:-1] not in visit:

1242

if visit and dir[:-1] not in visit:

1243

continue

1243

continue

1244

m = subm._matches_inner(match)

1244

m = subm._matches_inner(match)

1245

if not m._isempty():

1245

if not m._isempty():

1246

ret._dirs[dir] = m

1246

ret._dirs[dir] = m

1247

1248

if not ret._isempty():

1248

if not ret._isempty():

1249

ret._dirty = True

1249

ret._dirty = True

1250

return ret

1250

return ret

1251

1252

def fastdelta(self, base, changes):
    """Always raise ``FastdeltaUnavailable``; both arguments are ignored."""
    raise FastdeltaUnavailable()

1254

1255

def diff(self, m2, match=None, clean=False):
    """Compute the differences between this manifest and m2.

    Args:
      m2: the manifest this one is compared against.
      match: optional matcher; when given and not an "always" matcher,
         both manifests are narrowed with it before comparing.
      clean: if true, files that are identical on both sides are also
         listed, with a None value.

    Returns a dict keyed by file name. Each value has the form
    ((n1, fl1), (n2, fl2)) where n1/n2 are the nodeids and fl1/fl2 the
    flags in this/the other manifest. For a file missing on one side the
    nodeid is None and the flags are the empty string.
    """
    if match and not match.always():
        left = self._matches(match)
        right = m2._matches(match)
        return left.diff(right, clean=clean)
    changes = {}
    nothing = treemanifest()

    def _compare(left, right, pending):
        """Diff the files of two trees and queue their subtrees on
        ``pending`` for later comparison."""
        if left._node == right._node and not left._dirty and not right._dirty:
            return
        left._load()
        right._load()
        self._loaddifflazy(left, right)

        for dirname, leftsub in pycompat.iteritems(left._dirs):
            pending.append((leftsub, right._dirs.get(dirname, nothing)))

        for dirname, rightsub in pycompat.iteritems(right._dirs):
            if dirname not in left._dirs:
                pending.append((nothing, rightsub))

        for fname, leftnode in pycompat.iteritems(left._files):
            leftflag = left._flags.get(fname, b'')
            rightnode = right._files.get(fname, None)
            rightflag = right._flags.get(fname, b'')
            if leftnode != rightnode or leftflag != rightflag:
                changes[left._subpath(fname)] = (
                    (leftnode, leftflag),
                    (rightnode, rightflag),
                )
            elif clean:
                changes[left._subpath(fname)] = None

        for fname, rightnode in pycompat.iteritems(right._files):
            if fname in left._files:
                continue
            rightflag = right._flags.get(fname, b'')
            changes[right._subpath(fname)] = (
                (None, b''),
                (rightnode, rightflag),
            )

    # An explicit work list is used instead of recursion; _compare keeps
    # adding the subtree pairs it discovers.
    pending = [(self, m2)]
    while pending:
        left, right = pending.pop()
        _compare(left, right, pending)
    return changes

1315

1316

def unmodifiedsince(self, m2):
    """Return True when neither manifest is dirty and both have the same
    node."""
    if self._dirty or m2._dirty:
        return False
    return self._node == m2._node

1318

1319

def parse(self, text, readsubtree):
    """Populate this manifest from the entries ``_parse`` yields for
    ``text``.

    Entries flagged ``t`` are recorded as lazy subdirectories bound to
    ``readsubtree``; all other entries are stored as files.
    """
    lazydirs = self._lazydirs
    for path, node, flag in _parse(text):
        if flag == b't':
            # False below means "doesn't need to be copied" and can use the
            # cached value from readsubtree directly.
            lazydirs[path + b'/'] = (node, readsubtree, False)
            continue
        if b'/' not in path:
            # Assigning to _files and _flags avoids marking as dirty,
            # and should be a little faster.
            self._files[path] = node
            if flag:
                self._flags[path] = flag
            continue
        # This is a flat manifest, so use __setitem__ and setflag rather
        # than assigning directly to _files and _flags, so we can
        # assign a path in a subdirectory, and to mark dirty (compared
        # to nullid).
        self[path] = node
        if flag:
            self.setflag(path, flag)

1341

1342

def text(self):
    """Return the full content of this manifest as a bytestring."""
    self._load()
    entries = self.iterentries()
    return _text(entries)

1346

1347

def dirtext(self):
    """Return the content of this single directory as a bytestring.

    Submanifests must have been written beforehand so that the nodeids
    recorded for them are correct.
    """
    self._load()
    flagof = self.flags
    # Subdirectory keys end with a slash, which is dropped in the output;
    # every subdirectory entry carries the b't' flag.
    lazyentries = [
        (name[:-1], info[0], b't')
        for name, info in pycompat.iteritems(self._lazydirs)
    ]
    entries = [
        (name[:-1], subtree._node, b't')
        for name, subtree in pycompat.iteritems(self._dirs)
    ]
    entries.extend(
        (name, node, flagof(name))
        for name, node in pycompat.iteritems(self._files)
    )
    entries.extend(lazyentries)
    entries.sort()
    return _text(entries)

1359

1360

def read(self, gettext, readsubtree):
    """Install a deferred loader on this manifest.

    Nothing is parsed here. The stored ``_loadfunc``, once called with a
    manifest, parses the result of ``gettext()`` into it and clears its
    dirty flag.
    """

    def _deferredload(target):
        target.parse(gettext(), readsubtree)
        # freshly parsed content has no pending modification
        target._dirty = False

    self._loadfunc = _deferredload

1366

1367

def writesubtrees(self, m1, m2, writesubtree, match):
    """Call ``writesubtree`` for each subdirectory of this manifest that
    ``match`` may be interested in.

    ``m1`` and ``m2`` are the manifests from which the two parent nodes
    of each subdirectory are looked up.
    """
    self._load()  # for consistency; should never have any effect here
    m1._load()
    m2._load()
    nothing = treemanifest()

    def _parentnode(manifest, dirname):
        """Node of ``dirname`` in ``manifest``, without loading a lazy
        entry."""
        lazy = manifest._lazydirs.get(dirname)
        if lazy:
            return lazy[0]
        return manifest._dirs.get(dirname, nothing)._node

    # let's skip investigating things that `match` says we do not need.
    visit = self._loadchildrensetlazy(
        match.visitchildrenset(self._dir[:-1])
    )
    if visit in (b'this', b'all'):
        visit = None
    for dirname, subtree in pycompat.iteritems(self._dirs):
        if visit and dirname[:-1] not in visit:
            continue
        first = _parentnode(m1, dirname)
        second = _parentnode(m2, dirname)
        if first == nullid:
            # keep a null first parent out of the first slot
            first, second = second, first
        writesubtree(subtree, first, second, match)

1392

1393

def walksubtrees(self, matcher=None):
    """Iterate over this manifest and all of its subtrees.

    When ``matcher`` is provided, trees it refuses to visit are pruned
    together with everything below them, and only trees it matches are
    yielded.
    """
    if matcher:
        if not matcher.visitdir(self._dir[:-1]):
            return
        if matcher(self._dir[:-1]):
            yield self
    else:
        yield self

    self._load()
    # OPT: use visitchildrenset to avoid loading everything.
    self._loadalllazy()
    for _dirname, child in pycompat.iteritems(self._dirs):
        for found in child.walksubtrees(matcher=matcher):
            yield found

1410

1411

1412

class manifestfulltextcache(util.lrucachedict):
    """LRU cache of manifest full texts that can be persisted to a file.

    The file is a sequence of entries running up to EOF, each made of:

      - 20 bytes node, 4 bytes length, <length> manifest data

    Entries are written in reverse cache order (oldest to newest).

    The file is read lazily, on the first access that needs the content.
    """

    _file = b'manifestfulltextcache'

    def __init__(self, max):
        super(manifestfulltextcache, self).__init__(max)
        # in-memory state differs from what the file holds
        self._dirty = False
        # the persisted file has already been loaded
        self._read = False
        # opener used to reach the file; nothing is read or written
        # while it is None
        self._opener = None

    def _ensureread(self):
        """Load the persisted entries unless that was already done."""
        if not self._read:
            self.read()

    def read(self):
        """Fill the cache from the persisted file, if an opener is set."""
        if self._read or self._opener is None:
            return

        try:
            with self._opener(self._file) as fp:
                # go through the parent class so that loading does not
                # mark the cache dirty
                store = super(manifestfulltextcache, self).__setitem__
                # ignore trailing data, this is a cache, corruption is skipped
                while True:
                    # TODO do we need to do work here for sha1 portability?
                    key = fp.read(20)
                    if len(key) < 20:
                        break
                    try:
                        (size,) = struct.unpack(b'>L', fp.read(4))
                    except struct.error:
                        break
                    data = bytearray(fp.read(size))
                    if len(data) != size:
                        break
                    store(key, data)
        except IOError:
            # the file is allowed to be missing
            pass

        self._read = True
        self._dirty = False

    def write(self):
        """Persist the cache content when it is dirty and an opener is
        set."""
        if not self._dirty or self._opener is None:
            return
        # rotate backwards to the first used node
        try:
            with self._opener(
                self._file, b'w', atomictemp=True, checkambig=True
            ) as fp:
                entry = self._head.prev
                while True:
                    if entry.key in self._cache:
                        fp.write(entry.key)
                        fp.write(struct.pack(b'>L', len(entry.value)))
                        fp.write(entry.value)
                    if entry is self._head:
                        break
                    entry = entry.prev
        except IOError:
            # We could not write the cache (eg: permission error);
            # the content can be missing.
            #
            # We could try harder and see if we could recreate a wcache
            # directory where we could write to.
            #
            # XXX the error passes silently, having some way to issue an
            # error log through `ui.log` would be nice.
            pass

    def __len__(self):
        self._ensureread()
        return super(manifestfulltextcache, self).__len__()

    def __contains__(self, k):
        self._ensureread()
        return super(manifestfulltextcache, self).__contains__(k)

    def __iter__(self):
        self._ensureread()
        return super(manifestfulltextcache, self).__iter__()

    def __getitem__(self, k):
        self._ensureread()
        # the cache lru order can change on read
        reordered = self._cache.get(k) is not self._head
        found = super(manifestfulltextcache, self).__getitem__(k)
        if reordered:
            self._dirty = True
        return found

    def __setitem__(self, k, v):
        self._ensureread()
        super(manifestfulltextcache, self).__setitem__(k, v)
        self._dirty = True

    def __delitem__(self, k):
        self._ensureread()
        super(manifestfulltextcache, self).__delitem__(k)
        self._dirty = True

    def get(self, k, default=None):
        self._ensureread()
        return super(manifestfulltextcache, self).get(k, default=default)

    def clear(self, clear_persisted_data=False):
        """Empty the in-memory cache.

        With ``clear_persisted_data`` the now empty cache is also written
        out. In both cases the next access reads the file again.
        """
        super(manifestfulltextcache, self).clear()
        if clear_persisted_data:
            self._dirty = True
            self.write()
        self._read = False

1535

1536

1537

# An upper bound on what we expect from compression
# (the value seen in real life seems to be "3").
MAXCOMPRESSION = 3

1540

1541

1542

class FastdeltaUnavailable(Exception):
    """Raised when fastdelta cannot be used on a manifest."""

1544

1545

1546

@interfaceutil.implementer(repository.imanifeststorage)

1546

@interfaceutil.implementer(repository.imanifeststorage)

1547

class manifestrevlog(object):

1547

class manifestrevlog(object):

1548

"""A revlog that stores manifest texts. This is responsible for caching the

1548

"""A revlog that stores manifest texts. This is responsible for caching the

1549

full-text manifest contents.

1549

full-text manifest contents.

1550

"""

1550

"""

1551

1552

def __init__(

1552

def __init__(

1553

self,

1553

self,

1554

opener,

1554

opener,

1555

tree=b'',

1555

tree=b'',

1556

dirlogcache=None,

1556

dirlogcache=None,

1557

indexfile=None,

1557

indexfile=None,

1558

treemanifest=False,

1558

treemanifest=False,

1559

):

1559

):

1560

"""Constructs a new manifest revlog

1560

"""Constructs a new manifest revlog

1561

1562

`indexfile` - used by extensions to have two manifests at once, like

1562

`indexfile` - used by extensions to have two manifests at once, like

1563

when transitioning between flatmanifeset and treemanifests.

1563

when transitioning between flatmanifeset and treemanifests.

1564

1565

`treemanifest` - used to indicate this is a tree manifest revlog. Opener

1565

`treemanifest` - used to indicate this is a tree manifest revlog. Opener

1566

options can also be used to make this a tree manifest revlog. The opener

1566

options can also be used to make this a tree manifest revlog. The opener

1567

option takes precedence, so if it is set to True, we ignore whatever

1567

option takes precedence, so if it is set to True, we ignore whatever

1568

value is passed in to the constructor.

1568

value is passed in to the constructor.

1569

"""

1569

"""

1570

# During normal operations, we expect to deal with not more than four

1570

# During normal operations, we expect to deal with not more than four

1571

# revs at a time (such as during commit --amend). When rebasing large

1571

# revs at a time (such as during commit --amend). When rebasing large

1572

# stacks of commits, the number can go up, hence the config knob below.

1572

# stacks of commits, the number can go up, hence the config knob below.

1573

cachesize = 4

1573

cachesize = 4

1574

optiontreemanifest = False

1574

optiontreemanifest = False

1575

opts = getattr(opener, 'options', None)

1575

opts = getattr(opener, 'options', None)

1576

if opts is not None:

1576

if opts is not None:

1577

cachesize = opts.get(b'manifestcachesize', cachesize)

1577

cachesize = opts.get(b'manifestcachesize', cachesize)

1578

optiontreemanifest = opts.get(b'treemanifest', False)

1578

optiontreemanifest = opts.get(b'treemanifest', False)

1579

1580

self._treeondisk = optiontreemanifest or treemanifest

1580

self._treeondisk = optiontreemanifest or treemanifest

1581

1582

self._fulltextcache = manifestfulltextcache(cachesize)

1582

self._fulltextcache = manifestfulltextcache(cachesize)

1583

1584

if tree:

1584

if tree:

1585

assert self._treeondisk, b'opts is %r' % opts

1585

assert self._treeondisk, b'opts is %r' % opts

1586

1587

if indexfile is None:

1587

if indexfile is None:

1588

indexfile = b'00manifest.i'

1588

indexfile = b'00manifest.i'

1589

if tree:

1589

if tree:

1590

indexfile = b"meta/" + tree + indexfile

1590

indexfile = b"meta/" + tree + indexfile

1591

1592

self.tree = tree

1592

self.tree = tree

1593

1594

# The dirlogcache is kept on the root manifest log

1594

# The dirlogcache is kept on the root manifest log

1595

if tree:

1595

if tree:

1596

self._dirlogcache = dirlogcache

1596

self._dirlogcache = dirlogcache

1597

else:

1597

else:

1598

self._dirlogcache = {b'': self}

1598

self._dirlogcache = {b'': self}

1599

1600

self._revlog = revlog.revlog(

1600

self._revlog = revlog.revlog(

1601

opener,

1601

opener,

1602

indexfile,

1602

indexfile,

1603

# only root indexfile is cached

1603

# only root indexfile is cached

1604

checkambig=not bool(tree),

1604

checkambig=not bool(tree),

1605

mmaplargeindex=True,

1605

mmaplargeindex=True,

1606

upperboundcomp=MAXCOMPRESSION,

1606

upperboundcomp=MAXCOMPRESSION,

1607

persistentnodemap=opener.options.get(b'persistent-nodemap', False),

1607

persistentnodemap=opener.options.get(b'persistent-nodemap', False),

1608

)

1608

)

1609

1610

self.index = self._revlog.index

1610

self.index = self._revlog.index

1611

self.version = self._revlog.version

1611

self.version = self._revlog.version

1612

self._generaldelta = self._revlog._generaldelta

1612

self._generaldelta = self._revlog._generaldelta

1613

1614

def _setupmanifestcachehooks(self, repo):

1614

def _setupmanifestcachehooks(self, repo):

1615

"""Persist the manifestfulltextcache on lock release"""

1615

"""Persist the manifestfulltextcache on lock release"""

1616

if not util.safehasattr(repo, b'_wlockref'):

1616

if not util.safehasattr(repo, b'_wlockref'):

1617

return

1617

return

1618

1619

self._fulltextcache._opener = repo.wcachevfs

1619

self._fulltextcache._opener = repo.wcachevfs

1620

if repo._currentlock(repo._wlockref) is None:

1620

if repo._currentlock(repo._wlockref) is None:

1621

return

1621

return

1622

1623

reporef = weakref.ref(repo)

1623

reporef = weakref.ref(repo)

1624

manifestrevlogref = weakref.ref(self)

1624

manifestrevlogref = weakref.ref(self)

1625

1626

def persistmanifestcache(success):

1626

def persistmanifestcache(success):

1627

# Repo is in an unknown state, do not persist.

1627

# Repo is in an unknown state, do not persist.

1628

if not success:

1628

if not success:

1629

return

1629

return

1630

1631

repo = reporef()

1631

repo = reporef()

1632

self = manifestrevlogref()

1632

self = manifestrevlogref()

1633

if repo is None or self is None:

1633

if repo is None or self is None:

1634

return

1634

return

1635

if repo.manifestlog.getstorage(b'') is not self:

1635

if repo.manifestlog.getstorage(b'') is not self:

1636

# there's a different manifest in play now, abort

1636

# there's a different manifest in play now, abort

1637

return

1637

return

1638

self._fulltextcache.write()

1638

self._fulltextcache.write()

1639

1640

repo._afterlock(persistmanifestcache)

1640

repo._afterlock(persistmanifestcache)

1641

1642

@property

1642

@property

1643

def fulltextcache(self):

1643

def fulltextcache(self):

1644

return self._fulltextcache

1644

return self._fulltextcache

1645

1646

def clearcaches(self, clear_persisted_data=False):

1646

def clearcaches(self, clear_persisted_data=False):

1647

self._revlog.clearcaches()

1647

self._revlog.clearcaches()

1648

self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)

1648

self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)

1649

self._dirlogcache = {self.tree: self}

1649

self._dirlogcache = {self.tree: self}

1650

1651

def dirlog(self, d):
    """Return the manifest log for directory ``d``, creating it on demand.

    A non-empty ``d`` is only accepted when ``self._treeondisk`` is set
    (enforced with an assertion). Logs are memoized in
    ``self._dirlogcache``, which is also handed to every newly created
    ``manifestrevlog``.
    """
    if d:
        assert self._treeondisk
    if d not in self._dirlogcache:
        mfrevlog = manifestrevlog(
            self.opener, d, self._dirlogcache, treemanifest=self._treeondisk
        )
        self._dirlogcache[d] = mfrevlog
    return self._dirlogcache[d]

1660

1661

def add(
    self,
    m,
    transaction,
    link,
    p1,
    p2,
    added,
    removed,
    readtree=None,
    match=None,
):
    """Add a manifest entry to the manifest log and return its node.

    input:

      m:           the manifest dict we want to store
      transaction: the open transaction
      link:        passed through unchanged to the revlog's addrevision()
      p1:          manifest-node of p1
      p2:          manifest-node of p2
      added:       files added/changed compared to parent
      removed:     files removed compared to parent

    tree manifest input:

      readtree:    a function to read a subtree
      match:       a filematcher for the subpart of the tree manifest

    The return value is whatever the revlog's addrevision() (or
    ``_addtree`` for on-disk tree manifests) returned. When a full text
    is available it is also stored in ``self.fulltextcache`` under that
    node.
    """
    try:
        if p1 not in self.fulltextcache:
            raise FastdeltaUnavailable()
        # If our first parent is in the manifest cache, we can
        # compute a delta here using properties we know about the
        # manifest up-front, which may save time later for the
        # revlog layer.

        _checkforbidden(added)
        # combine the changed lists into one sorted iterator
        work = heapq.merge(
            [(x, False) for x in sorted(added)],
            [(x, True) for x in sorted(removed)],
        )

        arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
        cachedelta = self._revlog.rev(p1), deltatext
        text = util.buffer(arraytext)
        n = self._revlog.addrevision(
            text, transaction, link, p1, p2, cachedelta
        )
    except FastdeltaUnavailable:
        # The first parent manifest isn't already loaded or the
        # manifest implementation doesn't support fastdelta, so
        # we'll just encode a fulltext of the manifest and pass
        # that through to the revlog layer, and let it handle the
        # delta process.
        if self._treeondisk:
            assert readtree, b"readtree must be set for treemanifest writes"
            assert match, b"match must be specified for treemanifest writes"
            m1 = readtree(self.tree, p1)
            m2 = readtree(self.tree, p2)
            n = self._addtree(
                m, transaction, link, m1, m2, readtree, match=match
            )
            # No flat full text exists for a tree write, so nothing to cache.
            arraytext = None
        else:
            text = m.text()
            n = self._revlog.addrevision(text, transaction, link, p1, p2)
            arraytext = bytearray(text)

    if arraytext is not None:
        self.fulltextcache[n] = arraytext

    return n

1734

1735

def _addtree(self, m, transaction, link, m1, m2, readtree, match):
    """Write tree manifest ``m`` (and its subtrees) and return its node.

    ``m1`` and ``m2`` are the parent manifests. For a non-root tree
    (``self.tree != b''``) no revision is written when ``m`` is unchanged
    relative to a parent; that parent's (or ``m``'s own) node is reused.
    Otherwise the directory text is added to the wrapped revlog. In every
    path that reaches the end, the resulting node is recorded on ``m``
    with ``setnode``.
    """
    # If the manifest is unchanged compared to one parent,
    # don't write a new revision
    if self.tree != b'' and (
        m.unmodifiedsince(m1) or m.unmodifiedsince(m2)
    ):
        return m.node()

    def writesubtree(subm, subp1, subp2, match):
        # Callback for writesubtrees(): store one sub-manifest in the
        # log of its own directory.
        sublog = self.dirlog(subm.dir())
        sublog.add(
            subm,
            transaction,
            link,
            subp1,
            subp2,
            None,
            None,
            readtree=readtree,
            match=match,
        )

    m.writesubtrees(m1, m2, writesubtree, match)
    text = m.dirtext()
    n = None
    if self.tree != b'':
        # Double-check whether contents are unchanged to one parent
        if text == m1.dirtext():
            n = m1.node()
        elif text == m2.dirtext():
            n = m2.node()

    if not n:
        n = self._revlog.addrevision(
            text, transaction, link, m1.node(), m2.node()
        )

    # Save nodeid so parent manifest can calculate its nodeid
    m.setnode(n)
    return n

1775

1776

def __len__(self):
    """Return ``len()`` of the wrapped revlog."""
    return len(self._revlog)

1778

1779

def __iter__(self):
    """Return the iterator produced by the wrapped revlog's ``__iter__``."""
    return self._revlog.__iter__()

1781

1782

def rev(self, node):
    """Forward ``rev(node)`` to the wrapped revlog and return its result."""
    return self._revlog.rev(node)

1784

1785

def node(self, rev):
    """Forward ``node(rev)`` to the wrapped revlog and return its result."""
    return self._revlog.node(rev)

1787

1788

def lookup(self, value):
    """Forward ``lookup(value)`` to the wrapped revlog and return its result."""
    return self._revlog.lookup(value)

1790

1791

def parentrevs(self, rev):
    """Forward ``parentrevs(rev)`` to the wrapped revlog and return its result."""
    return self._revlog.parentrevs(rev)

1793

1794

def parents(self, node):
    """Forward ``parents(node)`` to the wrapped revlog and return its result."""
    return self._revlog.parents(node)

1796

1797

def linkrev(self, rev):
    """Forward ``linkrev(rev)`` to the wrapped revlog and return its result."""
    return self._revlog.linkrev(rev)

1799

1800

def checksize(self):
    """Forward ``checksize()`` to the wrapped revlog and return its result."""
    return self._revlog.checksize()

1802

1803

def revision(self, node, _df=None, raw=False):
    """Forward ``revision()`` to the wrapped revlog.

    ``_df`` and ``raw`` are passed through as keyword arguments.
    """
    return self._revlog.revision(node, _df=_df, raw=raw)

1805

1806

def rawdata(self, node, _df=None):
    """Forward ``rawdata()`` to the wrapped revlog, passing ``_df`` by keyword."""
    return self._revlog.rawdata(node, _df=_df)

1808

1809

def revdiff(self, rev1, rev2):
    """Forward ``revdiff(rev1, rev2)`` to the wrapped revlog and return its result."""
    return self._revlog.revdiff(rev1, rev2)

1811

1812

def cmp(self, node, text):
    """Forward ``cmp(node, text)`` to the wrapped revlog and return its result."""
    return self._revlog.cmp(node, text)

1814

1815

def deltaparent(self, rev):
    """Forward ``deltaparent(rev)`` to the wrapped revlog and return its result."""
    return self._revlog.deltaparent(rev)

1817

1818

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
):
    """Forward ``emitrevisions()`` to the wrapped revlog.

    ``nodes`` is passed positionally; every other argument is passed
    through by keyword, unchanged.
    """
    return self._revlog.emitrevisions(
        nodes,
        nodesorder=nodesorder,
        revisiondata=revisiondata,
        assumehaveparentrevisions=assumehaveparentrevisions,
        deltamode=deltamode,
    )

1833

1834

def addgroup(
    self,
    deltas,
    linkmapper,
    transaction,
    addrevisioncb=None,
    duplicaterevisioncb=None,
):
    """Forward ``addgroup()`` to the wrapped revlog.

    ``deltas``, ``linkmapper`` and ``transaction`` are passed
    positionally; the two optional callbacks are passed by keyword.
    """
    return self._revlog.addgroup(
        deltas,
        linkmapper,
        transaction,
        addrevisioncb=addrevisioncb,
        duplicaterevisioncb=duplicaterevisioncb,
    )

1849

1850

def rawsize(self, rev):
    """Forward ``rawsize(rev)`` to the wrapped revlog and return its result."""
    return self._revlog.rawsize(rev)

1852

1853

def getstrippoint(self, minlink):
    """Forward ``getstrippoint(minlink)`` to the wrapped revlog and return its result."""
    return self._revlog.getstrippoint(minlink)

1855

1856

def strip(self, minlink, transaction):
    """Forward ``strip(minlink, transaction)`` to the wrapped revlog."""
    return self._revlog.strip(minlink, transaction)

1858

1859

def files(self):
    """Forward ``files()`` to the wrapped revlog and return its result."""
    return self._revlog.files()

1861

1862

def clone(self, tr, destrevlog, **kwargs):
    """Clone the wrapped revlog into ``destrevlog``'s wrapped revlog.

    ``destrevlog`` must be a ``manifestrevlog``; anything else raises
    ``error.ProgrammingError``. Extra keyword arguments are forwarded
    unchanged to the underlying revlog's ``clone()``.
    """
    if not isinstance(destrevlog, manifestrevlog):
        raise error.ProgrammingError(b'expected manifestrevlog to clone()')

    return self._revlog.clone(tr, destrevlog._revlog, **kwargs)

1867

1868

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Forward ``storageinfo()`` to the wrapped revlog.

    Every flag is passed through by keyword, unchanged.
    """
    return self._revlog.storageinfo(
        exclusivefiles=exclusivefiles,
        sharedfiles=sharedfiles,
        revisionscount=revisionscount,
        trackedsize=trackedsize,
        storedsize=storedsize,
    )

1883

1884

@property
def indexfile(self):
    """The ``indexfile`` attribute of the wrapped revlog (readable and writable)."""
    return self._revlog.indexfile

@indexfile.setter
def indexfile(self, value):
    # Assignments are written straight through to the wrapped revlog.
    self._revlog.indexfile = value

1891

1892

@property
def opener(self):
    """The ``opener`` attribute of the wrapped revlog (readable and writable)."""
    return self._revlog.opener

@opener.setter
def opener(self, value):
    # Assignments are written straight through to the wrapped revlog.
    self._revlog.opener = value

1899

1900

1901

@interfaceutil.implementer(repository.imanifestlog)
class manifestlog(object):
    """A collection class representing the collection of manifest snapshots
    referenced by commits in the repository.

    In this situation, 'manifest' refers to the abstract concept of a snapshot
    of the list of files in the given commit. Consumers of the output of this
    class do not care about the implementation details of the actual manifests
    they receive (i.e. tree or flat or lazily loaded, etc)."""

    def __init__(self, opener, repo, rootstore, narrowmatch):
        """Set up the log around ``rootstore``.

        ``opener.options`` (when present) may override the defaults through
        its ``b'treemanifest'`` and ``b'manifestcachesize'`` keys. ``repo``
        is only handed to the root store's cache-hook setup.
        """
        usetreemanifest = False
        cachesize = 4

        opts = getattr(opener, 'options', None)
        if opts is not None:
            usetreemanifest = opts.get(b'treemanifest', usetreemanifest)
            cachesize = opts.get(b'manifestcachesize', cachesize)

        self._treemanifests = usetreemanifest

        self._rootstore = rootstore
        self._rootstore._setupmanifestcachehooks(repo)
        self._narrowmatch = narrowmatch

        # A cache of the manifestctx or treemanifestctx for each directory
        self._dirmancache = {}
        self._dirmancache[b''] = util.lrucachedict(cachesize)

        self._cachesize = cachesize

    def __getitem__(self, node):
        """Retrieves the manifest instance for the given node. Throws a
        LookupError if not found.
        """
        return self.get(b'', node)

    def get(self, tree, node, verify=True):
        """Retrieves the manifest instance for the given node. Throws a
        LookupError if not found.

        `tree` - the directory whose manifest is wanted (b'' for the root)
        `verify` - if True an exception will be thrown if the node is not in
                   the revlog

        Raises error.Abort when a sub-directory is requested but the root
        store is not a tree manifest on disk.
        """
        if node in self._dirmancache.get(tree, ()):
            return self._dirmancache[tree][node]

        if not self._narrowmatch.always():
            # tree carries a trailing character that visitdir() must not see
            if not self._narrowmatch.visitdir(tree[:-1]):
                return excludeddirmanifestctx(tree, node)
        if tree:
            if self._rootstore._treeondisk:
                if verify:
                    # Side-effect is LookupError is raised if node doesn't
                    # exist.
                    self.getstorage(tree).rev(node)

                m = treemanifestctx(self, tree, node)
            else:
                raise error.Abort(
                    _(
                        b"cannot ask for manifest directory '%s' in a flat "
                        b"manifest"
                    )
                    % tree
                )
        else:
            if verify:
                # Side-effect is LookupError is raised if node doesn't exist.
                self._rootstore.rev(node)

            if self._treemanifests:
                m = treemanifestctx(self, b'', node)
            else:
                m = manifestctx(self, node)

        # The null node is never cached.
        if node != nullid:
            mancache = self._dirmancache.get(tree)
            if not mancache:
                mancache = util.lrucachedict(self._cachesize)
                self._dirmancache[tree] = mancache
            mancache[node] = m
        return m

    def getstorage(self, tree):
        """Return the root store's directory log for ``tree``."""
        return self._rootstore.dirlog(tree)

    def clearcaches(self, clear_persisted_data=False):
        """Empty the per-directory context cache and the root store's caches."""
        self._dirmancache.clear()
        self._rootstore.clearcaches(clear_persisted_data=clear_persisted_data)

    def rev(self, node):
        """Forward ``rev(node)`` to the root store."""
        return self._rootstore.rev(node)

    def update_caches(self, transaction):
        """Forward ``update_caches()`` to the root store's underlying revlog."""
        return self._rootstore._revlog.update_caches(transaction=transaction)

1997

1998

1999

@interfaceutil.implementer(repository.imanifestrevisionwritable)
class memmanifestctx(object):
    """An in-memory flat manifest that can be written to the manifest log."""

    def __init__(self, manifestlog):
        self._manifestlog = manifestlog
        # Starts out as an empty manifest; copy() replaces it.
        self._manifestdict = manifestdict()

    def _storage(self):
        """Return the root (b'') storage of the owning manifest log."""
        return self._manifestlog.getstorage(b'')

    def copy(self):
        """Return a new memmanifestctx holding a copy of this manifest."""
        memmf = memmanifestctx(self._manifestlog)
        memmf._manifestdict = self.read().copy()
        return memmf

    def read(self):
        """Return the in-memory manifest dict (not a copy)."""
        return self._manifestdict

    def write(self, transaction, link, p1, p2, added, removed, match=None):
        """Store the in-memory manifest through the root storage's add().

        All arguments are forwarded unchanged; the result of add() is
        returned.
        """
        return self._storage().add(
            self._manifestdict,
            transaction,
            link,
            p1,
            p2,
            added,
            removed,
            match=match,
        )

2027

2028

2029

@interfaceutil.implementer(repository.imanifestrevisionstored)
class manifestctx(object):
    """A class representing a single revision of a manifest, including its
    contents, its parent revs, and its linkrev.
    """

    def __init__(self, manifestlog, node):
        self._manifestlog = manifestlog
        # Parsed manifest, filled in lazily by read().
        self._data = None

        self._node = node

        # TODO: We eventually want p1, p2, and linkrev exposed on this class,
        # but let's add it later when something needs it and we can load it
        # lazily.
        # self.p1, self.p2 = store.parents(node)
        # rev = store.rev(node)
        # self.linkrev = store.linkrev(rev)

    def _storage(self):
        """Return the root (b'') storage of the owning manifest log."""
        return self._manifestlog.getstorage(b'')

    def node(self):
        """Return the node this context was created for."""
        return self._node

    def copy(self):
        """Return a memmanifestctx holding a copy of this revision's manifest."""
        memmf = memmanifestctx(self._manifestlog)
        memmf._manifestdict = self.read().copy()
        return memmf

    @propertycache
    def parents(self):
        """The storage's parents() result for this node."""
        return self._storage().parents(self._node)

    def read(self):
        """Return the parsed manifest, loading and memoizing it on first use.

        The null node yields an empty manifestdict. Otherwise the text comes
        from the storage's fulltextcache when present, or from the storage's
        revision() (in which case the cache is populated).
        """
        if self._data is None:
            if self._node == nullid:
                self._data = manifestdict()
            else:
                store = self._storage()
                if self._node in store.fulltextcache:
                    text = pycompat.bytestr(store.fulltextcache[self._node])
                else:
                    text = store.revision(self._node)
                    arraytext = bytearray(text)
                    store.fulltextcache[self._node] = arraytext
                self._data = manifestdict(text)
        return self._data

    def readfast(self, shallow=False):
        """Calls either readdelta or read, based on which would be less work.
        readdelta is called if the delta is against the p1, and therefore can be
        read quickly.

        If `shallow` is True, nothing changes since this is a flat manifest.
        """
        store = self._storage()
        r = store.rev(self._node)
        deltaparent = store.deltaparent(r)
        if deltaparent != nullrev and deltaparent in store.parentrevs(r):
            return self.readdelta()
        return self.read()

    def readdelta(self, shallow=False):
        """Returns a manifest containing just the entries that are present
        in this manifest, but not in its p1 manifest. This is efficient to read
        if the revlog delta is already p1.

        Note that the diff is taken against the storage's delta parent for
        this revision, whatever that revision is.

        Changing the value of `shallow` has no effect on flat manifests.
        """
        store = self._storage()
        r = store.rev(self._node)
        d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))
        return manifestdict(d)

    def find(self, key):
        """Forward ``find(key)`` to the parsed manifest."""
        return self.read().find(key)

2106

2107

2108

@interfaceutil.implementer(repository.imanifestrevisionwritable)
class memtreemanifestctx(object):
    """An in-memory tree manifest that can be written to the manifest log."""

    def __init__(self, manifestlog, dir=b''):
        self._manifestlog = manifestlog
        self._dir = dir
        # Starts out as an empty tree manifest; copy() replaces it.
        self._treemanifest = treemanifest()

    def _storage(self):
        """Return the root (b'') storage of the owning manifest log."""
        return self._manifestlog.getstorage(b'')

    def copy(self):
        """Return a new memtreemanifestctx (same dir) with a copied manifest."""
        memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
        memmf._treemanifest = self._treemanifest.copy()
        return memmf

    def read(self):
        """Return the in-memory tree manifest (not a copy)."""
        return self._treemanifest

    def write(self, transaction, link, p1, p2, added, removed, match=None):
        """Store the in-memory tree manifest through the root storage's add().

        A ``readtree`` callback that reads subtrees via the manifest log is
        supplied to add(); the result of add() is returned.
        """

        def readtree(dir, node):
            return self._manifestlog.get(dir, node).read()

        return self._storage().add(
            self._treemanifest,
            transaction,
            link,
            p1,
            p2,
            added,
            removed,
            readtree=readtree,
            match=match,
        )

2141

2142

2143

@interfaceutil.implementer(repository.imanifestrevisionstored)

2143

@interfaceutil.implementer(repository.imanifestrevisionstored)

2144

class treemanifestctx(object):

2144

class treemanifestctx(object):

2145

def __init__(self, manifestlog, dir, node):
    """Remember the owning manifest log, the directory and the node.

    Nothing is read here; ``_data`` stays ``None`` until read() fills it.
    """
    self._manifestlog = manifestlog
    self._dir = dir
    self._data = None

    self._node = node

    # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so that
    # we can instantiate treemanifestctx objects for directories we don't
    # have on disk.
    # self.p1, self.p2 = store.parents(node)
    # rev = store.rev(node)
    # self.linkrev = store.linkrev(rev)

2158

2159

def _storage(self):
    """Return the storage object for this context's directory.

    When the manifest log's narrow matcher is not ``always()`` and does
    not visit this directory, an ``excludedmanifestrevlog`` is returned
    instead of the real storage.
    """
    narrowmatch = self._manifestlog._narrowmatch
    if not narrowmatch.always():
        # _dir carries a trailing character that visitdir() must not see
        if not narrowmatch.visitdir(self._dir[:-1]):
            return excludedmanifestrevlog(self._dir)
    return self._manifestlog.getstorage(self._dir)

2165

2166

def read(self):
    """Return the parsed tree manifest, loading and memoizing it on first use.

    Three cases are handled: the null node (empty treemanifest), storage
    that keeps trees on disk (lazy read with a subtree loader), and flat
    storage (text taken from the fulltextcache or the storage's
    revision(), which then populates the cache).
    """
    if self._data is None:
        store = self._storage()
        if self._node == nullid:
            self._data = treemanifest()
        # TODO accessing non-public API
        elif store._treeondisk:
            m = treemanifest(dir=self._dir)

            def gettext():
                return store.revision(self._node)

            def readsubtree(dir, subm):
                # Set verify to False since we need to be able to create
                # subtrees for trees that don't exist on disk.
                return self._manifestlog.get(dir, subm, verify=False).read()

            m.read(gettext, readsubtree)
            m.setnode(self._node)
            self._data = m
        else:
            if self._node in store.fulltextcache:
                text = pycompat.bytestr(store.fulltextcache[self._node])
            else:
                text = store.revision(self._node)
                arraytext = bytearray(text)
                store.fulltextcache[self._node] = arraytext
            self._data = treemanifest(dir=self._dir, text=text)

    return self._data

2196

2197

def node(self):

2197

def node(self):

2198

return self._node

2198

return self._node

2199

2200

def copy(self):

2200

def copy(self):

2201

memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)

2201

memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)

2202

memmf._treemanifest = self.read().copy()

2202

memmf._treemanifest = self.read().copy()

2203

return memmf

2203

return memmf

2204

2205

@propertycache

2205

@propertycache

2206

def parents(self):

2206

def parents(self):

2207

return self._storage().parents(self._node)

2207

return self._storage().parents(self._node)

2208

2209

def readdelta(self, shallow=False):

2209

def readdelta(self, shallow=False):

2210

"""Returns a manifest containing just the entries that are present

2210

"""Returns a manifest containing just the entries that are present

2211

in this manifest, but not in its p1 manifest. This is efficient to read

2211

in this manifest, but not in its p1 manifest. This is efficient to read

2212

if the revlog delta is already p1.

2212

if the revlog delta is already p1.

2213

2214

If `shallow` is True, this will read the delta for this directory,

2214

If `shallow` is True, this will read the delta for this directory,

2215

without recursively reading subdirectory manifests. Instead, any

2215

without recursively reading subdirectory manifests. Instead, any

2216

subdirectory entry will be reported as it appears in the manifest, i.e.

2216

subdirectory entry will be reported as it appears in the manifest, i.e.

2217

the subdirectory will be reported among files and distinguished only by

2217

the subdirectory will be reported among files and distinguished only by

2218

its 't' flag.

2218

its 't' flag.

2219

"""

2219

"""

2220

store = self._storage()

2220

store = self._storage()

2221

if shallow:

2221

if shallow:

2222

r = store.rev(self._node)

2222

r = store.rev(self._node)

2223

d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))

2223

d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))

2224

return manifestdict(d)

2224

return manifestdict(d)

2225

else:

2225

else:

2226

# Need to perform a slow delta

2226

# Need to perform a slow delta

2227

r0 = store.deltaparent(store.rev(self._node))

2227

r0 = store.deltaparent(store.rev(self._node))

2228

m0 = self._manifestlog.get(self._dir, store.node(r0)).read()

2228

m0 = self._manifestlog.get(self._dir, store.node(r0)).read()

2229

m1 = self.read()

2229

m1 = self.read()

2230

md = treemanifest(dir=self._dir)

2230

md = treemanifest(dir=self._dir)

2231

for f, ((n0, fl0), (n1, fl1)) in pycompat.iteritems(m0.diff(m1)):

2231

for f, ((n0, fl0), (n1, fl1)) in pycompat.iteritems(m0.diff(m1)):

2232

if n1:

2232

if n1:

2233

md[f] = n1

2233

md[f] = n1

2234

if fl1:

2234

if fl1:

2235

md.setflag(f, fl1)

2235

md.setflag(f, fl1)

2236

return md

2236

return md

2237

2238

def readfast(self, shallow=False):

2238

def readfast(self, shallow=False):

2239

"""Calls either readdelta or read, based on which would be less work.

2239

"""Calls either readdelta or read, based on which would be less work.

2240

readdelta is called if the delta is against the p1, and therefore can be

2240

readdelta is called if the delta is against the p1, and therefore can be

2241

read quickly.

2241

read quickly.

2242

2243

If `shallow` is True, it only returns the entries from this manifest,

2243

If `shallow` is True, it only returns the entries from this manifest,

2244

and not any submanifests.

2244

and not any submanifests.

2245

"""

2245

"""

2246

store = self._storage()

2246

store = self._storage()

2247

r = store.rev(self._node)

2247

r = store.rev(self._node)

2248

deltaparent = store.deltaparent(r)

2248

deltaparent = store.deltaparent(r)

2249

if deltaparent != nullrev and deltaparent in store.parentrevs(r):

2249

if deltaparent != nullrev and deltaparent in store.parentrevs(r):

2250

return self.readdelta(shallow=shallow)

2250

return self.readdelta(shallow=shallow)

2251

2252

if shallow:

2252

if shallow:

2253

return manifestdict(store.revision(self._node))

2253

return manifestdict(store.revision(self._node))

2254

else:

2254

else:

2255

return self.read()

2255

return self.read()

2256

2257

def find(self, key):

2257

def find(self, key):

2258

return self.read().find(key)

2258

return self.read().find(key)

2259

2260

2261

class excludeddir(treemanifest):

2261

class excludeddir(treemanifest):

2262

"""Stand-in for a directory that is excluded from the repository.

2262

"""Stand-in for a directory that is excluded from the repository.

2263

2264

With narrowing active on a repository that uses treemanifests,

2264

With narrowing active on a repository that uses treemanifests,

2265

some of the directory revlogs will be excluded from the resulting

2265

some of the directory revlogs will be excluded from the resulting

2266

clone. This is a huge storage win for clients, but means we need

2266

clone. This is a huge storage win for clients, but means we need

2267

some sort of pseudo-manifest to surface to internals so we can

2267

some sort of pseudo-manifest to surface to internals so we can

2268

detect a merge conflict outside the narrowspec. That's what this

2268

detect a merge conflict outside the narrowspec. That's what this

2269

class is: it stands in for a directory whose node is known, but

2269

class is: it stands in for a directory whose node is known, but

2270

whose contents are unknown.

2270

whose contents are unknown.

2271

"""

2271

"""

2272

2273

def __init__(self, dir, node):

2273

def __init__(self, dir, node):

2274

super(excludeddir, self).__init__(dir)

2274

super(excludeddir, self).__init__(dir)

2275

self._node = node

2275

self._node = node

2276

# Add an empty file, which will be included by iterators and such,

2276

# Add an empty file, which will be included by iterators and such,

2277

# appearing as the directory itself (i.e. something like "dir/")

2277

# appearing as the directory itself (i.e. something like "dir/")

2278

self._files[b''] = node

2278

self._files[b''] = node

2279

self._flags[b''] = b't'

2279

self._flags[b''] = b't'

2280

2281

# Manifests outside the narrowspec should never be modified, so avoid

2281

# Manifests outside the narrowspec should never be modified, so avoid

2282

# copying. This makes a noticeable difference when there are very many

2282

# copying. This makes a noticeable difference when there are very many

2283

# directories outside the narrowspec. Also, it makes sense for the copy to

2283

# directories outside the narrowspec. Also, it makes sense for the copy to

2284

# be of the same type as the original, which would not happen with the

2284

# be of the same type as the original, which would not happen with the

2285

# super type's copy().

2285

# super type's copy().

2286

def copy(self):

2286

def copy(self):

2287

return self

2287

return self

2288

2289

2290

class excludeddirmanifestctx(treemanifestctx):

2290

class excludeddirmanifestctx(treemanifestctx):

2291

"""context wrapper for excludeddir - see that docstring for rationale"""

2291

"""context wrapper for excludeddir - see that docstring for rationale"""

2292

2293

def __init__(self, dir, node):

2293

def __init__(self, dir, node):

2294

self._dir = dir

2294

self._dir = dir

2295

self._node = node

2295

self._node = node

2296

2297

def read(self):

2297

def read(self):

2298

return excludeddir(self._dir, self._node)

2298

return excludeddir(self._dir, self._node)

2299

2300

def readfast(self, shallow=False):

2301

# special version of readfast since we don't have underlying storage

2302

return self.read()

2303

2300

def write(self, *args):

2304

def write(self, *args):

2301

raise error.ProgrammingError(

2305

raise error.ProgrammingError(

2302

b'attempt to write manifest from excluded dir %s' % self._dir

2306

b'attempt to write manifest from excluded dir %s' % self._dir

2303

)

2307

)

2304

2308

2305

2309

2306

class excludedmanifestrevlog(manifestrevlog):

2310

class excludedmanifestrevlog(manifestrevlog):

2307

"""Stand-in for excluded treemanifest revlogs.

2311

"""Stand-in for excluded treemanifest revlogs.

2308

2312

2309

When narrowing is active on a treemanifest repository, we'll have

2313

When narrowing is active on a treemanifest repository, we'll have

2310

references to directories we can't see due to the revlog being

2314

references to directories we can't see due to the revlog being

2311

skipped. This class exists to conform to the manifestrevlog

2315

skipped. This class exists to conform to the manifestrevlog

2312

interface for those directories and proactively prevent writes to

2316

interface for those directories and proactively prevent writes to

2313

outside the narrowspec.

2317

outside the narrowspec.

2314

"""

2318

"""

2315

2319

2316

def __init__(self, dir):

2320

def __init__(self, dir):

2317

self._dir = dir

2321

self._dir = dir

2318

2322

2319

def __len__(self):

2323

def __len__(self):

2320

raise error.ProgrammingError(

2324

raise error.ProgrammingError(

2321

b'attempt to get length of excluded dir %s' % self._dir

2325

b'attempt to get length of excluded dir %s' % self._dir

2322

)

2326

)

2323

2327

2324

def rev(self, node):

2328

def rev(self, node):

2325

raise error.ProgrammingError(

2329

raise error.ProgrammingError(

2326

b'attempt to get rev from excluded dir %s' % self._dir

2330

b'attempt to get rev from excluded dir %s' % self._dir

2327

)

2331

)

2328

2332

2329

def linkrev(self, node):

2333

def linkrev(self, node):

2330

raise error.ProgrammingError(

2334

raise error.ProgrammingError(

2331

b'attempt to get linkrev from excluded dir %s' % self._dir

2335

b'attempt to get linkrev from excluded dir %s' % self._dir

2332

)

2336

)

2333

2337

2334

def node(self, rev):

2338

def node(self, rev):

2335

raise error.ProgrammingError(

2339

raise error.ProgrammingError(

2336

b'attempt to get node from excluded dir %s' % self._dir

2340

b'attempt to get node from excluded dir %s' % self._dir

2337

)

2341

)

2338

2342

2339

def add(self, *args, **kwargs):

2343

def add(self, *args, **kwargs):

2340

# We should never write entries in dirlogs outside the narrow clone.

2344

# We should never write entries in dirlogs outside the narrow clone.

2341

# However, the method still gets called from writesubtree() in

2345

# However, the method still gets called from writesubtree() in

2342

# _addtree(), so we need to handle it. We should possibly make that

2346

# _addtree(), so we need to handle it. We should possibly make that

2343

# avoid calling add() with a clean manifest (_dirty is always False

2347

# avoid calling add() with a clean manifest (_dirty is always False

2344

# in excludeddir instances).

2348

# in excludeddir instances).

2345

pass

2349

pass

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # manifest.py - manifest revision class for mercurial
             #
             # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import heapq
             import itertools
             import struct
             import weakref
             from .i18n import _
             from .node import (
                 bin,
                 hex,
                 nullid,
                 nullrev,
             )
             from .pycompat import getattr
             from . import (
                 encoding,
                 error,
                 match as matchmod,
                 mdiff,
                 pathutil,
                 policy,
                 pycompat,
                 revlog,
                 util,
             )
             from .interfaces import (
                 repository,
                 util as interfaceutil,
             )
             # Module object returned by policy.importmod() for 'parsers'; further down
             # it is probed for a ``lazymanifest`` attribute that replaces the
             # pure-Python ``_lazymanifest`` class when present.
             parsers = policy.importmod('parsers')
             # Short local alias so classes below can write ``@propertycache``.
             propertycache = util.propertycache
             # Allow tests to more easily test the alternate path in manifestdict.fastdelta()
             # fastdelta() assembles the delta change by change while the number of
             # changes stays below this value, and otherwise diffs the full texts with
             # mdiff.textdiff().
             FASTDELTA_TEXTDIFF_THRESHOLD = 1000
             def _parse(data):
                 """Yield ``(filename, binary node, flags)`` for each line of ``data``.

                 The precondition checks below look excessive on purpose: they keep this
                 pure implementation behaving exactly like its C counterpart, so that
                 code developed against the pure version does not break unexpectedly.

                 Raises ValueError when ``data`` does not end in a newline, when the
                 lines are not sorted, or when the hex node is not 40 or 64 digits long.
                 """
                 if data and not data.endswith(b'\n'):
                     raise ValueError(b'Manifest did not end in a newline.')
                 previous = None
                 for line in data.splitlines():
                     if previous is not None and line < previous:
                         raise ValueError(b'Manifest lines not in sorted order.')
                     previous = line
                     fname, hexnode = line.split(b'\0')
                     # A trailing byte that is a known flag is split off the hex node.
                     flag = hexnode[-1:]
                     if flag in _manifestflags:
                         hexnode = hexnode[:-1]
                     else:
                         flag = b''
                     if len(hexnode) not in (40, 64):
                         raise ValueError(b'Invalid manifest line')
                     yield fname, bin(hexnode), flag
             def _text(it):
                 """Serialize ``(filename, node, flags)`` triples into manifest text.

                 Every filename is collected and handed to ``_checkforbidden`` before
                 the joined text is returned.
                 """
                 names = []
                 chunks = []
                 for name, node, flag in it:
                     names.append(name)
                     # if this is changed to support newlines in filenames,
                     # be sure to check the templates/ dir again (especially *-raw.tmpl)
                     chunks.append(b"%s\0%s%s\n" % (name, hex(node), flag))

                 _checkforbidden(names)
                 return b''.join(chunks)
             class lazymanifestiter(object):
                 """Iterator over the filenames of a lazy manifest.

                 ``lm`` must provide ``_get(index)`` returning ``(data, pos)``; iteration
                 stops when ``_get`` raises IndexError.
                 """

                 def __init__(self, lm):
                     self.lm = lm
                     self.pos = 0

                 def __iter__(self):
                     return self

                 def next(self):
                     try:
                         data, offset = self.lm._get(self.pos)
                     except IndexError:
                         raise StopIteration
                     self.pos += 1
                     if offset == -1:
                         # entry held as a tuple: the filename is its first item
                         return data[0]
                     # entry held in the text buffer: the filename runs up to the NUL
                     return data[offset : data.find(b'\x00', offset)]

                 __next__ = next
             class lazymanifestiterentries(object):
                 """Iterator over the full entries of a lazy manifest.

                 Entries stored as tuples are returned unchanged; entries stored in the
                 text buffer are decoded into ``(filename, node, flags)``.
                 """

                 def __init__(self, lm):
                     self.pos = 0
                     self.lm = lm

                 def __iter__(self):
                     return self

                 def next(self):
                     try:
                         data, offset = self.lm._get(self.pos)
                     except IndexError:
                         raise StopIteration
                     if offset == -1:
                         self.pos += 1
                         return data

                     nul = data.find(b'\x00', offset)
                     eol = data.find(b'\n', offset)
                     # both separators must exist, with the NUL before the newline
                     if not 0 <= nul <= eol:
                         raise error.StorageError(b'Invalid manifest line')

                     hexlen = eol - nul - 1
                     flag = data[eol - 1 : eol]
                     if flag in _manifestflags:
                         # the byte before the newline is a flag, not a hex digit
                         hexlen -= 1
                     else:
                         flag = b''
                     if hexlen not in (40, 64):
                         raise error.StorageError(b'Invalid manifest line')

                     node = unhexlify(data, self.lm.extrainfo[self.pos], nul + 1, hexlen)
                     self.pos += 1
                     return (data[offset:nul], node, flag)

                 __next__ = next
             def unhexlify(data, extra, pos, length):
                 """Decode ``length`` hex digits of ``data`` starting at offset ``pos``.

                 ``extra``: when non-zero, its low 8 bits are appended to the decoded
                 value as one additional byte.

                 Returns the decoded byte string.
                 """
                 s = bin(data[pos : pos + length])
                 if extra:
                     # chr() returns text on Python 3 and cannot be appended to bytes;
                     # struct.pack gives a one-byte byte string on Python 2 and 3 alike.
                     s += struct.pack(b'>B', extra & 0xFF)
                 return s
             def _cmp(a, b):
                 """Three-way compare: 1 if ``a > b``, -1 if ``a < b``, otherwise 0."""
                 if a > b:
                     return 1
                 if a < b:
                     return -1
                 return 0
             # Flag values accepted on a manifest entry; the empty byte string stands for
             # "no flag".  NOTE(review): presumably l = symlink, t = tree (directory) and
             # x = executable -- confirm against the manifest format documentation.
             _manifestflags = {b'', b'l', b't', b'x'}
             class _lazymanifest(object):
                 """A pure python manifest backed by a byte string.  It is supplemented with
                 internal lists as it is modified, until it is compacted back to a pure byte
                 string.

                 ``data`` is the initial manifest data.

                 ``positions`` is a list of offsets, one per manifest entry.  Positive
                 values are offsets into ``data``, negative values are offsets into the
                 ``extradata`` list.  When an entry is removed, its entry is dropped from
                 ``positions``.  The values are encoded such that when walking the list and
                 indexing into ``data`` or ``extradata`` as appropriate, the entries are
                 sorted by filename.

                 ``extradata`` is a list of (key, hash, flags) for entries that were added or
                 modified since the manifest was created or compacted.
                 """

                 def __init__(
                     self,
                     data,
                     positions=None,
                     extrainfo=None,
                     extradata=None,
                     hasremovals=False,
                 ):
                     """Build a manifest from ``data``.

                     When ``positions`` is None the line offsets are computed from
                     ``data`` and the other optional arguments are ignored; otherwise
                     the three lists are shallow-copied and ``hasremovals`` is kept.
                     """
                     if positions is None:
                         self.positions = self.findlines(data)
                         self.extrainfo = [0] * len(self.positions)
                         self.data = data
                         self.extradata = []
                         self.hasremovals = False
                     else:
                         self.positions = positions[:]
                         self.extrainfo = extrainfo[:]
                         self.extradata = extradata[:]
                         self.data = data
                         self.hasremovals = hasremovals

                 def findlines(self, data):
                     """Return the offset of the start of every line in ``data``.

                     Raises ValueError if non-empty ``data`` does not end in a newline
                     or if the filenames are not in sorted order.
                     """
                     if not data:
                         return []
                     pos = data.find(b"\n")
                     if pos == -1 or data[-1:] != b'\n':
                         raise ValueError(b"Manifest did not end in a newline.")
                     positions = [0]
                     prev = data[: data.find(b'\x00')]
                     while pos < len(data) - 1 and pos != -1:
                         positions.append(pos + 1)
                         nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]
                         if nexts < prev:
                             raise ValueError(b"Manifest lines not in sorted order.")
                         prev = nexts
                         pos = data.find(b"\n", pos + 1)
                     return positions

                 def _get(self, index):
                     """Return ``(container, pos)`` for the entry at ``index``.

                     For an entry living in the text buffer this is ``(self.data,
                     offset)``; for an entry living in ``extradata`` it is
                     ``((key, hash, flags), -1)``.
                     """
                     # get the position encoded in pos:
                     #   positive number is an index in 'data'
                     #   negative number is in extrapieces
                     pos = self.positions[index]
                     if pos >= 0:
                         return self.data, pos
                     return self.extradata[-pos - 1], -1

                 def _getkey(self, pos):
                     """Return the filename for an encoded position (see ``_get``)."""
                     if pos >= 0:
                         return self.data[pos : self.data.find(b'\x00', pos + 1)]
                     return self.extradata[-pos - 1][0]

                 def bsearch(self, key):
                     """Binary-search ``key``; return its index in ``positions`` or -1."""
                     first = 0
                     last = len(self.positions) - 1

                     while first <= last:
                         midpoint = (first + last) // 2
                         nextpos = self.positions[midpoint]
                         candidate = self._getkey(nextpos)
                         r = _cmp(key, candidate)
                         if r == 0:
                             return midpoint
                         else:
                             if r < 0:
                                 last = midpoint - 1
                             else:
                                 first = midpoint + 1
                     return -1

                 def bsearch2(self, key):
                     """Binary-search ``key``; return ``(index, found)``.

                     When ``found`` is False, ``index`` is the insertion point that
                     keeps ``positions`` sorted by filename.
                     """
                     # same as the above, but will always return the position
                     # done for performance reasons
                     first = 0
                     last = len(self.positions) - 1

                     while first <= last:
                         midpoint = (first + last) // 2
                         nextpos = self.positions[midpoint]
                         candidate = self._getkey(nextpos)
                         r = _cmp(key, candidate)
                         if r == 0:
                             return (midpoint, True)
                         else:
                             if r < 0:
                                 last = midpoint - 1
                             else:
                                 first = midpoint + 1
                     return (first, False)

                 def __contains__(self, key):
                     return self.bsearch(key) != -1

                 def __getitem__(self, key):
                     """Return ``(hash, flags)`` for ``key``.

                     Raises TypeError if ``key`` is not bytes, KeyError if it is absent
                     and error.StorageError if the stored line is malformed.
                     """
                     if not isinstance(key, bytes):
                         raise TypeError(b"getitem: manifest keys must be a bytes.")
                     needle = self.bsearch(key)
                     if needle == -1:
                         raise KeyError
                     data, pos = self._get(needle)
                     if pos == -1:
                         return (data[1], data[2])
                     zeropos = data.find(b'\x00', pos)
                     nlpos = data.find(b'\n', zeropos)
                     assert 0 <= needle <= len(self.positions)
                     assert len(self.extrainfo) == len(self.positions)
                     if zeropos == -1 or nlpos == -1 or nlpos < zeropos:
                         raise error.StorageError(b'Invalid manifest line')
                     hlen = nlpos - zeropos - 1
                     flags = data[nlpos - 1 : nlpos]
                     if flags in _manifestflags:
                         # the byte before the newline is a flag, not a hex digit
                         hlen -= 1
                     else:
                         flags = b''
                     if hlen not in (40, 64):
                         raise error.StorageError(b'Invalid manifest line')
                     hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)
                     return (hashval, flags)

                 def __delitem__(self, key):
                     """Remove ``key``; raises KeyError if it is absent."""
                     needle, found = self.bsearch2(key)
                     if not found:
                         raise KeyError
                     cur = self.positions[needle]
                     # Both lists are private copies (see __init__), so dropping the
                     # slot in place is equivalent to rebuilding them by slicing.
                     del self.positions[needle]
                     del self.extrainfo[needle]
                     if cur >= 0:
                         # This does NOT unsort the list as far as the search functions are
                         # concerned, as they only examine lines mapped by self.positions.
                         self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]
                         self.hasremovals = True

                 def __setitem__(self, key, value):
                     """Store ``value`` (a ``(node, flags)`` tuple) under ``key``.

                     Raises TypeError when ``key`` is not bytes, when ``value`` is not a
                     2-tuple, when the node is not a 20- or 32-byte byte string, or when
                     the flags are not a byte string of length 0 or 1.
                     """
                     if not isinstance(key, bytes):
                         raise TypeError(b"setitem: manifest keys must be a byte string.")
                     if not isinstance(value, tuple) or len(value) != 2:
                         raise TypeError(
                             b"Manifest values must be a tuple of (node, flags)."
                         )
                     hashval = value[0]
                     if not isinstance(hashval, bytes) or len(hashval) not in (20, 32):
                         raise TypeError(b"node must be a 20-byte or 32-byte byte string")
                     flags = value[1]
                     if not isinstance(flags, bytes) or len(flags) > 1:
                         # Interpolate the offending value into the message instead of
                         # passing it as a second, unformatted exception argument.
                         raise TypeError(
                             b"flags must be a 0 or 1 byte string, got %r" % (flags,)
                         )
                     needle, found = self.bsearch2(key)
                     if found:
                         # put the item
                         pos = self.positions[needle]
                         if pos < 0:
                             self.extradata[-pos - 1] = (key, hashval, flags)
                         else:
                             # just don't bother
                             self.extradata.append((key, hashval, flags))
                             self.positions[needle] = -len(self.extradata)
                     else:
                         # not found, put it in with extra positions
                         self.extradata.append((key, hashval, flags))
                         self.positions.insert(needle, -len(self.extradata))
                         self.extrainfo.insert(needle, 0)

                 def copy(self):
                     """Return a new manifest sharing ``data`` but with copied lists."""
                     # XXX call _compact like in C?
                     return _lazymanifest(
                         self.data,
                         self.positions,
                         self.extrainfo,
                         self.extradata,
                         self.hasremovals,
                     )

                 def _compact(self):
                     """Fold ``extradata`` and removals back into a single ``data`` string.

                     Afterwards every position is a non-negative offset into the new
                     ``data``, ``extradata`` is empty and ``hasremovals`` is False.
                     """
                     # hopefully not called TOO often
                     if len(self.extradata) == 0 and not self.hasremovals:
                         return
                     l = []
                     i = 0
                     offset = 0
                     self.extrainfo = [0] * len(self.positions)
                     while i < len(self.positions):
                         if self.positions[i] >= 0:
                             cur = self.positions[i]
                             last_cut = cur

                             # Collect all contiguous entries in the buffer at the current
                             # offset, breaking out only for added/modified items held in
                             # extradata, or a deleted line prior to the next position.
                             while True:
                                 self.positions[i] = offset
                                 i += 1
                                 if i == len(self.positions) or self.positions[i] < 0:
                                     break

                                 # A removed file has no positions[] entry, but does have an
                                 # overwritten first byte.  Break out and find the end of the
                                 # current good entry/entries if there is a removed file
                                 # before the next position.
                                 if (
                                     self.hasremovals
                                     and self.data.find(b'\n\x00', cur, self.positions[i])
                                     != -1
                                 ):
                                     break

                                 offset += self.positions[i] - cur
                                 cur = self.positions[i]
                             end_cut = self.data.find(b'\n', cur)
                             if end_cut != -1:
                                 end_cut += 1
                             offset += end_cut - cur
                             l.append(self.data[last_cut:end_cut])
                         else:
                             while i < len(self.positions) and self.positions[i] < 0:
                                 cur = self.positions[i]
                                 t = self.extradata[-cur - 1]
                                 l.append(self._pack(t))
                                 self.positions[i] = offset
                                 # Hashes are either 20 bytes (old sha1s) or 32
                                 # bytes (new non-sha1).
                                 hlen = 20
                                 if len(t[1]) > 25:
                                     hlen = 32
                                 # NOTE(review): __setitem__ only admits 20- or 32-byte
                                 # nodes and _pack asserts the same, so this branch looks
                                 # unreachable; the index and the ord() call should be
                                 # re-checked if longer hashes are ever allowed.
                                 if len(t[1]) > hlen:
                                     self.extrainfo[i] = ord(t[1][hlen + 1])
                                 offset += len(l[-1])
                                 i += 1
                     self.data = b''.join(l)
                     self.hasremovals = False
                     self.extradata = []

                 def _pack(self, d):
                     """Render a ``(key, hash, flags)`` tuple as one manifest line."""
                     n = d[1]
                     assert len(n) in (20, 32)
                     return d[0] + b'\x00' + hex(n) + d[2] + b'\n'

                 def text(self):
                     """Compact the manifest and return its text."""
                     self._compact()
                     return self.data

                 def diff(self, m2, clean=False):
                     '''Finds changes between the current manifest and m2.

                     Returns a dict mapping each differing filename to
                     ``((node1, flags1), (node2, flags2))``, where the missing side is
                     ``(None, b'')``.  With ``clean`` true, unchanged files are included
                     with a None value.
                     '''
                     # XXX think whether efficiency matters here
                     diff = {}

                     for fn, e1, flags in self.iterentries():
                         if fn not in m2:
                             diff[fn] = (e1, flags), (None, b'')
                         else:
                             e2 = m2[fn]
                             if (e1, flags) != e2:
                                 diff[fn] = (e1, flags), e2
                             elif clean:
                                 diff[fn] = None

                     for fn, e2, flags in m2.iterentries():
                         if fn not in self:
                             diff[fn] = (None, b''), (e2, flags)

                     return diff

                 def iterentries(self):
                     return lazymanifestiterentries(self)

                 def iterkeys(self):
                     return lazymanifestiter(self)

                 def __iter__(self):
                     return lazymanifestiter(self)

                 def __len__(self):
                     return len(self.positions)

                 def filtercopy(self, filterfn):
                     """Return a new manifest holding the entries ``filterfn`` accepts."""
                     # XXX should be optimized
                     c = _lazymanifest(b'')
                     for f, n, fl in self.iterentries():
                         if filterfn(f):
                             c[f] = n, fl
                     return c
             # Prefer the lazymanifest implementation exported by the ``parsers`` module;
             # when that attribute is missing, the pure-Python class defined above stays
             # bound to the name.
             try:
                 _lazymanifest = parsers.lazymanifest
             except AttributeError:
                 pass
             @interfaceutil.implementer(repository.imanifestdict)
             class manifestdict(object):
                 """Mapping-style wrapper around a ``_lazymanifest``.

                 Subscripting reads and writes the node of a file; flags are reached
                 through ``flags()``, ``find()`` and ``setflag()``.
                 """

                 def __init__(self, data=b''):
                     self._lm = _lazymanifest(data)

                 def __getitem__(self, key):
                     """Return the node stored for ``key``."""
                     entry = self._lm[key]
                     return entry[0]

                 def find(self, key):
                     """Return the raw entry the underlying manifest holds for ``key``."""
                     return self._lm[key]

                 def __len__(self):
                     return len(self._lm)

                 def __nonzero__(self):
                     # __len__ already implies truthiness; spelling it out here gives
                     # extensions a dedicated method to override.
                     return bool(len(self._lm))

                 __bool__ = __nonzero__

                 def __setitem__(self, key, node):
                     """Set the node of ``key``, keeping whatever flags it already has."""
                     currentflags = self.flags(key)
                     self._lm[key] = node, currentflags

                 def __contains__(self, key):
                     return key is not None and key in self._lm

                 def __delitem__(self, key):
                     del self._lm[key]

                 def __iter__(self):
                     return iter(self._lm)

                 def iterkeys(self):
                     return self._lm.iterkeys()

                 def keys(self):
                     return list(self.iterkeys())

                 def filesnotin(self, m2, match=None):
                     '''Set of files in this manifest that are not in the other'''
                     if match is None:
                         return {f for f in self if f not in m2}
                     # wrap the matcher so that bad-file reports are ignored
                     match = matchmod.badmatch(match, lambda path, msg: None)
                     theirs = set(m2.walk(match))
                     return {f for f in self.walk(match) if f not in theirs}

                 @propertycache
                 def _dirs(self):
                     return pathutil.dirs(self)

                 def dirs(self):
                     return self._dirs

                 def hasdir(self, dir):
                     return dir in self._dirs

                 def _filesfastpath(self, match):
                     """Tell whether iterating over the matcher's files is both correct
                     and quicker than iterating over the manifest's files."""
                     files = match.files()
                     if not len(files) < 100:
                         return False
                     exact = match.isexact()
                     if exact:
                         return exact
                     return match.prefix() and all(fn in self for fn in files)

                 def walk(self, match):
                     """Generates matching file names.

                     Yields the same names as manifest.matches(match).iterkeys(), without
                     building a whole new manifest.

                     Files named by the matcher that do not exist are reported through
                     match.bad().
                     """
                     if match.always():
                         for name in self:
                             yield name
                         return

                     pending = set(match.files())

                     # when only specific files are wanted, skip the full walk
                     if self._filesfastpath(match):
                         for name in sorted(pending):
                             if name in self:
                                 yield name
                         return

                     for name in self:
                         # an explicitly listed file that exists is no longer pending
                         pending.discard(name)
                         if match(name):
                             yield name

                     # for dirstate.walk, files=[''] means "walk the whole tree".
                     # follow that here, too
                     pending.discard(b'')

                     for name in sorted(pending):
                         if not self.hasdir(name):
                             match.bad(name, None)

                 def _matches(self, match):
                     '''generate a new manifest filtered by the match argument'''
                     if match.always():
                         return self.copy()

                     usefastpath = self._filesfastpath(match)
                     filtered = manifestdict()
                     if usefastpath:
                         source = self._lm
                         for name in match.files():
                             if name in source:
                                 filtered._lm[name] = source[name]
                     else:
                         filtered._lm = self._lm.filtercopy(match)
                     return filtered

                 def diff(self, m2, match=None, clean=False):
                     """Finds changes between the current manifest and m2.

                     Args:
                       m2: the manifest to which this manifest should be compared.
                       match: optional matcher; when given, both manifests are
                              filtered through it before being compared.
                       clean: if true, include files unchanged between these manifests
                              with a None value in the returned dictionary.

                     The result is a dict keyed by filename whose values have the form
                     ((n1,fl1),(n2,fl2)): n1/n2 is the nodeid in the current/other
                     manifest and fl1/fl2 the flag in the current/other manifest. Where
                     the file does not exist, the nodeid is None and the flags are the
                     empty string.
                     """
                     if not match:
                         return self._lm.diff(m2._lm, clean)
                     mine = self._matches(match)
                     theirs = m2._matches(match)
                     return mine.diff(theirs, clean=clean)

                 def setflag(self, key, flag):
                     """Set the flag of ``key``; raises TypeError for an unknown flag."""
                     if flag not in _manifestflags:
                         raise TypeError(b"Invalid manifest flag set.")
                     node = self[key]
                     self._lm[key] = node, flag

                 def get(self, key, default=None):
                     """Return the node of ``key``, or ``default`` when it is absent."""
                     try:
                         return self._lm[key][0]
                     except KeyError:
                         pass
                     return default

                 def flags(self, key):
                     """Return the flags of ``key``, or ``b''`` when it is absent."""
                     try:
                         return self._lm[key][1]
                     except KeyError:
                         pass
                     return b''

                 def copy(self):
                     duplicate = manifestdict()
                     duplicate._lm = self._lm.copy()
                     return duplicate

                 def items(self):
                     return (entry[:2] for entry in self._lm.iterentries())

                 def iteritems(self):
                     return (entry[:2] for entry in self._lm.iterentries())

                 def iterentries(self):
                     return self._lm.iterentries()

                 def text(self):
                     # most likely uses native version
                     return self._lm.text()

                 def fastdelta(self, base, changes):
                     """Given a base manifest text as a bytearray and a list of changes
                     relative to that text, compute a delta that can be used by revlog.

                     ``changes`` is iterated as ``(filename, todelete)`` pairs.  Returns
                     ``(arraytext, deltatext)``.
                     """
                     delta = []
                     spanstart = None
                     spanend = None
                     spanlines = [b""]
                     start = 0
                     # zero copy representation of base as a buffer
                     basebuf = util.buffer(base)

                     changes = list(changes)
                     if len(changes) >= FASTDELTA_TEXTDIFF_THRESHOLD:
                         # For large changes, it's much cheaper to just build the text
                         # and diff it.
                         arraytext = bytearray(self.text())
                         deltatext = mdiff.textdiff(
                             util.buffer(base), util.buffer(arraytext)
                         )
                         return arraytext, deltatext

                     # start with a readonly loop that finds the offset of
                     # each line and creates the deltas
                     for fname, todelete in changes:
                         # start is either the offset of the item or its insert point
                         start, end = _msearch(basebuf, fname, start)
                         if todelete:
                             if start == end:
                                 # item we want to delete was not found, error out
                                 raise AssertionError(
                                     _(b"failed to remove %s from manifest") % fname
                                 )
                             line = b""
                         else:
                             node, flag = self._lm[fname]
                             line = b"%s\0%s%s\n" % (fname, hex(node), flag)

                         if spanstart is not None and spanstart <= start <= spanend:
                             # touches the span being built: grow it
                             spanend = max(spanend, end)
                             if line:
                                 spanlines.append(line)
                         else:
                             # flush the finished span, then open a new one
                             if spanstart is not None:
                                 delta.append([spanstart, spanend, b"".join(spanlines)])
                             spanstart = start
                             spanend = end
                             spanlines = [line]

                     if spanstart is not None:
                         delta.append([spanstart, spanend, b"".join(spanlines)])
                     # apply the delta to the base, and get a delta for addrevision
                     deltatext, arraytext = _addlistdelta(base, delta)
                     return arraytext, deltatext
             def _msearch(m, s, lo=0, hi=None):
                 """Locate the manifest line for ``s`` inside ``m``; return ``(start, end)``.

                 On a hit, ``m[start:end]`` is the whole line holding ``s``.  On a miss
                 ``start == end`` and both give the offset where the line would have to
                 be inserted to keep ``m`` sorted.

                 ``m`` should be a buffer, a memoryview or a byte string; ``s`` is a
                 byte string."""

                 def skipto(idx, char):
                     # walk forward until ``char`` is found or the end of m is reached
                     while idx < size and m[idx : idx + 1] != char:
                         idx += 1
                     return idx

                 if not s:
                     return (lo, lo)

                 size = len(m)
                 hi = hi or size

                 while lo < hi:
                     # rewind from the midpoint to the start of the line it falls in
                     linestart = (lo + hi) // 2
                     while linestart > 0 and m[linestart - 1 : linestart] != b'\n':
                         linestart -= 1
                     nul = skipto(linestart, b'\0')
                     if bytes(m[linestart:nul]) < s:
                         # we know that after the null there are 40 bytes of sha1
                         # this translates to the bisect lo = mid + 1
                         lo = skipto(nul + 40, b'\n') + 1
                     else:
                         # this translates to the bisect hi = mid
                         hi = linestart

                 nul = skipto(lo, b'\0')
                 if s == m[lo:nul]:
                     # we know that after the null there are 40 bytes of sha1
                     eol = skipto(nul + 40, b'\n')
                     return (lo, eol + 1)
                 return (lo, lo)
             def _checkforbidden(l):
                 """Check filenames for illegal characters."""
                 for f in l:
                     if b'\n' in f or b'\r' in f:
                         raise error.StorageError(
                             _(b"'\\n' and '\\r' disallowed in filenames: %r")
                             % pycompat.bytestr(f)
                         )
             # apply the changes collected during the bisect loop to our addlist
             # return a delta suitable for addrevision
             def _addlistdelta(addlist, x):
                 # for large addlist arrays, building a new array is cheaper
                 # than repeatedly modifying the existing one
                 currentposition = 0
                 newaddlist = bytearray()
                 for start, end, content in x:
                     newaddlist += addlist[currentposition:start]
                     if content:
                         newaddlist += bytearray(content)
                     currentposition = end
                 newaddlist += addlist[currentposition:]
                 deltatext = b"".join(
                     struct.pack(b">lll", start, end, len(content)) + content
                     for start, end, content in x
                 )
                 return deltatext, newaddlist
             def _splittopdir(f):
                 if b'/' in f:
                     dir, subpath = f.split(b'/', 1)
                     return dir + b'/', subpath
                 else:
                     return b'', f
             # Placeholder callback that does nothing. treemanifest stores it in
             # _loadfunc/_copyfunc and compares against it by identity to tell whether
             # a real deferred load or copy is still pending.
             _noop = lambda s: None
             @interfaceutil.implementer(repository.imanifestdict)
             class treemanifest(object):
                 def __init__(self, dir=b'', text=b''):
                     """Create an empty tree for directory ``dir``; when ``text`` is
                     given, fill it by parsing ``text`` as a flat manifest."""
                     self._dir = dir
                     self._node = nullid
                     # deferred loader/copier; _noop means that nothing is pending
                     self._loadfunc = self._copyfunc = _noop
                     self._dirty = False
                     self._dirs = {}
                     self._lazydirs = {}
                     # Using _lazymanifest here is a little slower than plain old dicts
                     self._files = {}
                     self._flags = {}
                     if not text:
                         return

                     def readsubtree(subdir, subm):
                         # reached only if the text contains a tree ('t') entry
                         raise AssertionError(
                             b'treemanifest constructor only accepts flat manifests'
                         )

                     self.parse(text, readsubtree)
                     self._dirty = True  # Mark flat manifest dirty after parsing
                 def _subpath(self, path):
                     """Return ``path`` prefixed with this tree's directory."""
                     return self._dir + path
                 def _loadalllazy(self):
                     """Move every entry of ``_lazydirs`` into ``_dirs`` by reading
                     its subtree, then reset ``_lazydirs`` to an empty dict."""
                     loaded = self._dirs
                     for name, entry in pycompat.iteritems(self._lazydirs):
                         node, readsubtree, docopy = entry
                         subtree = readsubtree(self._subpath(name), node)
                         # docopy asks for a private copy of what readsubtree returned
                         loaded[name] = subtree.copy() if docopy else subtree
                     self._lazydirs = {}
                 def _loadlazy(self, d):
                     v = self._lazydirs.get(d)
                     if v:
                         node, readsubtree, docopy = v
                         if docopy:
                             self._dirs[d] = readsubtree(self._subpath(d), node).copy()
                         else:
                             self._dirs[d] = readsubtree(self._subpath(d), node)
                         del self._lazydirs[d]
                 def _loadchildrensetlazy(self, visit):
                     if not visit:
                         return None
                     if visit == b'all' or visit == b'this':
                         self._loadalllazy()
                         return None
                     loadlazy = self._loadlazy
                     for k in visit:
                         loadlazy(k + b'/')
                     return visit
                 def _loaddifflazy(self, t1, t2):
                     """load items in t1 and t2 if they're needed for diffing.

                     The criteria currently is:
                     - if it's not present in _lazydirs in either t1 or t2, load it in the
                       other (it may already be loaded or it may not exist, doesn't matter)
                     - if it's present in _lazydirs in both, compare the nodeid; if it
                       differs, load it in both
                     """
                     lazy1 = t1._lazydirs
                     lazy2 = t2._lazydirs
                     pending = []
                     for d, v1 in pycompat.iteritems(lazy1):
                         v2 = lazy2.get(d)
                         # lazy on one side only, or lazy on both with different nodes
                         if not v2 or v2[0] != v1[0]:
                             pending.append(d)
                     pending.extend(d for d in lazy2 if d not in lazy1)

                     # load only after both scans so no dict changes while iterated
                     for d in pending:
                         t1._loadlazy(d)
                         t2._loadlazy(d)
                 def __len__(self):
                     self._load()
                     size = len(self._files)
                     self._loadalllazy()
                     for m in self._dirs.values():
                         size += m.__len__()
                     return size
                 def __nonzero__(self):
                     """Truth value of the tree: False exactly when ``_isempty()``
                     reports it empty."""
                     # Faster than "__len() != 0" since it avoids loading sub-manifests
                     return not self._isempty()
                 # Python 3 looks up __bool__; expose the same implementation there.
                 __bool__ = __nonzero__
                 def _isempty(self):
                     self._load()  # for consistency; already loaded by all callers
                     # See if we can skip loading everything.
                     if self._files or (
                         self._dirs and any(not m._isempty() for m in self._dirs.values())
                     ):
                         return False
                     self._loadalllazy()
                     return not self._dirs or all(m._isempty() for m in self._dirs.values())
                 @encoding.strmethod
                 def __repr__(self):
                     """Debug representation: directory, hex node, whether a load is
                     still pending, the dirty flag and the object id."""
                     fmt = b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
                     fields = (
                         self._dir,
                         hex(self._node),
                         # loaded means that no deferred load function is left
                         self._loadfunc is _noop,
                         self._dirty,
                         id(self),
                     )
                     return fmt % fields
                 def dir(self):
                     """Return the directory that this tree manifest represents,
                     including a trailing '/'. It is the empty string for the repo
                     root directory."""
                     return self._dir
                 def node(self):
                     """The node of this instance. nullid for unsaved instances. Should
                     be updated when the instance is read or written from a revlog.

                     Must not be called while the instance is dirty.
                     """
                     # a dirty tree has pending changes that _node does not reflect
                     assert not self._dirty
                     return self._node
                 def setnode(self, node):
                     """Record ``node`` as this instance's node and clear the dirty
                     flag."""
                     self._node = node
                     self._dirty = False
                 def iterentries(self):
                     self._load()
                     self._loadalllazy()
                     for p, n in sorted(
                         itertools.chain(self._dirs.items(), self._files.items())
                     ):
                         if p in self._files:
                             yield self._subpath(p), n, self._flags.get(p, b'')
                         else:
                             for x in n.iterentries():
                                 yield x
                 def items(self):
                     self._load()
                     self._loadalllazy()
                     for p, n in sorted(
                         itertools.chain(self._dirs.items(), self._files.items())
                     ):
                         if p in self._files:
                             yield self._subpath(p), n
                         else:
                             for f, sn in pycompat.iteritems(n):
                                 yield f, sn
                 iteritems = items
                 def iterkeys(self):
                     self._load()
                     self._loadalllazy()
                     for p in sorted(itertools.chain(self._dirs, self._files)):
                         if p in self._files:
                             yield self._subpath(p)
                         else:
                             for f in self._dirs[p]:
                                 yield f
                 def keys(self):
                     """Return a list with every path produced by ``iterkeys()``."""
                     return list(self.iterkeys())
                 def __iter__(self):
                     """Iterate over the file paths; same as ``iterkeys()``."""
                     return self.iterkeys()
                 def __contains__(self, f):
                     """Return True if file path ``f`` is in the tree; None is never
                     contained."""
                     if f is None:
                         return False
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         return f in self._files
                     # f is below a subdirectory: load it if lazy, then delegate
                     self._loadlazy(topdir)
                     if topdir not in self._dirs:
                         return False
                     return self._dirs[topdir].__contains__(rest)
                 def get(self, f, default=None):
                     """Return the node stored for file path ``f``, or ``default``
                     when there is none."""
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         return self._files.get(f, default)
                     # f is below a subdirectory: load it if lazy, then delegate
                     self._loadlazy(topdir)
                     if topdir not in self._dirs:
                         return default
                     return self._dirs[topdir].get(rest, default)
                 def __getitem__(self, f):
                     """Return the node stored for file path ``f``.

                     A missing file or subdirectory surfaces as the KeyError of the
                     underlying dict lookup.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         return self._files[f]
                     self._loadlazy(topdir)
                     return self._dirs[topdir].__getitem__(rest)
                 def flags(self, f):
                     """Return the flags recorded for path ``f``, or ``b''`` when it
                     has none, is unknown, or names a subdirectory key."""
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         # keys of _dirs/_lazydirs are directories and carry no flags
                         if f in self._lazydirs or f in self._dirs:
                             return b''
                         return self._flags.get(f, b'')
                     self._loadlazy(topdir)
                     if topdir not in self._dirs:
                         return b''
                     return self._dirs[topdir].flags(rest)
                 def find(self, f):
                     """Return ``(node, flags)`` for file path ``f``.

                     A missing file or subdirectory surfaces as the KeyError of the
                     underlying dict lookup; missing flags are reported as ``b''``.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         return self._files[f], self._flags.get(f, b'')
                     self._loadlazy(topdir)
                     return self._dirs[topdir].find(rest)
                 def __delitem__(self, f):
                     """Remove file path ``f`` (and its flags) and mark the tree dirty.

                     A missing file or subdirectory surfaces as the KeyError of the
                     underlying dict operation.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if topdir:
                         self._loadlazy(topdir)
                         subtree = self._dirs[topdir]
                         subtree.__delitem__(rest)
                         # If the directory is now empty, remove it
                         if subtree._isempty():
                             del self._dirs[topdir]
                     else:
                         del self._files[f]
                         self._flags.pop(f, None)
                     self._dirty = True
                 def __setitem__(self, f, n):
                     """Store node ``n`` for file path ``f``, creating intermediate
                     subtrees as needed, and mark the tree dirty."""
                     assert n is not None
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         # manifest nodes are either 20 bytes or 32 bytes,
                         # depending on the hash in use. Assert this as historically
                         # sometimes extra bytes were added.
                         assert len(n) in (20, 32)
                         self._files[f] = n
                     else:
                         self._loadlazy(topdir)
                         try:
                             subtree = self._dirs[topdir]
                         except KeyError:
                             subtree = treemanifest(self._subpath(topdir))
                             self._dirs[topdir] = subtree
                         subtree.__setitem__(rest, n)
                     self._dirty = True
                 def _load(self):
                     """Run the pending deferred load, or else the pending deferred
                     copy, at most one of them per call.

                     The callback slot is reset to ``_noop`` before the callback runs.
                     """
                     pending = self._loadfunc
                     if pending is not _noop:
                         self._loadfunc = _noop
                         pending(self)
                         return
                     pending = self._copyfunc
                     if pending is not _noop:
                         self._copyfunc = _noop
                         pending(self)
                 def setflag(self, f, flags):
                     """Set the flags (symlink, executable) for path f.

                     Raises TypeError when ``flags`` is not in ``_manifestflags``.
                     Intermediate subtrees are created as needed and the tree is
                     marked dirty.
                     """
                     if flags not in _manifestflags:
                         raise TypeError(b"Invalid manifest flag set.")
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         self._flags[f] = flags
                     else:
                         self._loadlazy(topdir)
                         try:
                             subtree = self._dirs[topdir]
                         except KeyError:
                             subtree = treemanifest(self._subpath(topdir))
                             self._dirs[topdir] = subtree
                         subtree.setflag(rest, flags)
                     self._dirty = True
                 def copy(self):
                     """Return a copy of this tree.

                     The copy is filled in immediately when this tree is already
                     loaded; otherwise the work is stored in the copy's ``_copyfunc``
                     and runs on its first ``_load()``.
                     """
                     dup = treemanifest(self._dir)
                     dup._node = self._node
                     dup._dirty = self._dirty
                     if self._copyfunc is not _noop:
                         # self is itself a copy that was not filled in yet: the new
                         # object reuses the same pending copier
                         dup._copyfunc = self._copyfunc
                         return dup

                     def _copyfunc(s):
                         self._load()
                         # lazy entries are flagged so that their subtree gets copied
                         # when it is eventually loaded
                         s._lazydirs = {
                             d: (n, r, True)
                             for d, (n, r, c) in pycompat.iteritems(self._lazydirs)
                         }
                         target = s._dirs
                         for d, subtree in pycompat.iteritems(self._dirs):
                             target[d] = subtree.copy()
                         s._files = dict.copy(self._files)
                         s._flags = dict.copy(self._flags)

                     if self._loadfunc is not _noop:
                         # self is not loaded yet: postpone the copy
                         dup._copyfunc = _copyfunc
                     else:
                         _copyfunc(dup)
                     return dup
                 def filesnotin(self, m2, match=None):
                     """Set of files in this manifest that are not in the other

                     When ``match`` is given and is not always(), both manifests are
                     filtered through it first.
                     """
                     if match and not match.always():
                         filtered1 = self._matches(match)
                         filtered2 = m2._matches(match)
                         return filtered1.filesnotin(filtered2)

                     missing = set()

                     def _collect(t1, t2):
                         # clean trees with the same node are skipped without loading
                         if t1._node == t2._node and not t1._dirty and not t2._dirty:
                             return
                         t1._load()
                         t2._load()
                         self._loaddifflazy(t1, t2)
                         for d, sub1 in pycompat.iteritems(t1._dirs):
                             if d not in t2._dirs:
                                 # the whole subdirectory is absent from t2
                                 missing.update(sub1.iterkeys())
                             else:
                                 _collect(sub1, t2._dirs[d])
                         missing.update(
                             t1._subpath(fn) for fn in t1._files if fn not in t2._files
                         )

                     _collect(self, m2)
                     return missing
                 @propertycache
                 def _alldirs(self):
                     """``pathutil.dirs`` object built from this manifest."""
                     # NOTE(review): propertycache presumably computes this once per
                     # instance; confirm that later mutations need no invalidation.
                     return pathutil.dirs(self)
                 def dirs(self):
                     """Return the ``_alldirs`` object of this manifest."""
                     return self._alldirs
                 def hasdir(self, dir):
                     """Return True if ``dir`` (given without trailing slash) is a
                     directory of this tree, whether loaded or still lazy."""
                     self._load()
                     topdir, subdir = _splittopdir(dir)
                     if not topdir:
                         # a direct child: directory keys carry a trailing slash
                         dirslash = dir + b'/'
                         return dirslash in self._dirs or dirslash in self._lazydirs
                     self._loadlazy(topdir)
                     if topdir not in self._dirs:
                         return False
                     return self._dirs[topdir].hasdir(subdir)
                 def walk(self, match):
                     """Generates matching file names.
                     It also reports nonexistent files by marking them bad with match.bad().
                     """
                     if match.always():
                         for f in iter(self):
                             yield f
                         return
                     fset = set(match.files())
                     for fn in self._walk(match):
                         if fn in fset:
                             # specified pattern is the exact name
                             fset.remove(fn)
                         yield fn
                     # for dirstate.walk, files=[''] means "walk the whole tree".
                     # follow that here, too
                     fset.discard(b'')
                     for fn in sorted(fset):
                         if not self.hasdir(fn):
                             match.bad(fn, None)
                 def _walk(self, match):
                     '''Recursively generates matching file names for walk().'''
                     visit = match.visitchildrenset(self._dir[:-1])
                     if not visit:
                         return
                     # yield this dir's files and walk its submanifests
                     self._load()
                     visit = self._loadchildrensetlazy(visit)
                     for p in sorted(list(self._dirs) + list(self._files)):
                         if p in self._files:
                             fullp = self._subpath(p)
                             if match(fullp):
                                 yield fullp
                         else:
                             if not visit or p[:-1] in visit:
                                 for f in self._dirs[p]._walk(match):
                                     yield f
                 def _matches(self, match):
                     """Recursively generate a new manifest filtered by the match
                     argument.

                     When ``match.always()`` is true the result is simply a copy.
                     """
                     if match.always():
                         return self.copy()
                     return self._matches_inner(match)
                 def _matches_inner(self, match):
                     """Build the filtered tree for this directory and, recursively,
                     for the subdirectories that ``match`` wants visited.

                     The result is marked dirty whenever it is not empty.
                     """
                     if match.always():
                         return self.copy()

                     visit = match.visitchildrenset(self._dir[:-1])
                     if visit == b'all':
                         return self.copy()
                     ret = treemanifest(self._dir)
                     if not visit:
                         return ret

                     self._load()
                     allfiles = visit == b'this'
                     for fn, node in pycompat.iteritems(self._files):
                         # While visitchildrenset *usually* lists only subdirs, this is
                         # actually up to the matcher and may have some files in the set().
                         # If visit == 'this', we should obviously look at the files in this
                         # directory; if visit is a set, and fn is in it, we should inspect
                         # fn (but no need to inspect things not in the set).
                         if not allfiles and fn not in visit:
                             continue
                         # visitchildrenset isn't perfect, we still need to call the regular
                         # matcher code to further filter results.
                         if not match(self._subpath(fn)):
                             continue
                         ret._files[fn] = node
                         if fn in self._flags:
                             ret._flags[fn] = self._flags[fn]

                     visit = self._loadchildrensetlazy(visit)
                     for dir, subm in pycompat.iteritems(self._dirs):
                         if visit and dir[:-1] not in visit:
                             continue
                         filtered = subm._matches_inner(match)
                         # subdirectories without any match are left out
                         if not filtered._isempty():
                             ret._dirs[dir] = filtered

                     if not ret._isempty():
                         ret._dirty = True
                     return ret
                 def fastdelta(self, base, changes):
                     """Always raise FastdeltaUnavailable; this class implements no
                     fast delta computation."""
                     raise FastdeltaUnavailable()
                 def diff(self, m2, match=None, clean=False):
                     """Finds changes between the current manifest and m2.

                     Args:
                       m2: the manifest to which this manifest should be compared.
                       match: optional matcher; when given and not always(), both
                              manifests are filtered through it before comparing.
                       clean: if true, include files unchanged between these manifests
                              with a None value in the returned dictionary.

                     The result is returned as a dict with filename as key and
                     values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
                     nodeid in the current/other manifest and fl1/fl2 is the flag
                     in the current/other manifest. Where the file does not exist,
                     the nodeid will be None and the flags will be the empty
                     string.
                     """
                     if match and not match.always():
                         filtered1 = self._matches(match)
                         filtered2 = m2._matches(match)
                         return filtered1.diff(filtered2, clean=clean)
                     result = {}
                     emptytree = treemanifest()

                     def compare(t1, t2, todo):
                         """record the file differences of t1 and t2 and append the
                         pairs of sub-manifests still to be compared to todo"""
                         if t1._node == t2._node and not t1._dirty and not t2._dirty:
                             return
                         t1._load()
                         t2._load()
                         self._loaddifflazy(t1, t2)

                         dirs1, dirs2 = t1._dirs, t2._dirs
                         # a directory missing on one side is paired with emptytree
                         todo.extend(
                             (sub1, dirs2.get(d, emptytree))
                             for d, sub1 in pycompat.iteritems(dirs1)
                         )
                         todo.extend(
                             (emptytree, sub2)
                             for d, sub2 in pycompat.iteritems(dirs2)
                             if d not in dirs1
                         )

                         files1, flags1 = t1._files, t1._flags
                         files2, flags2 = t2._files, t2._flags
                         for fn, n1 in pycompat.iteritems(files1):
                             fl1 = flags1.get(fn, b'')
                             n2 = files2.get(fn)
                             fl2 = flags2.get(fn, b'')
                             if n1 != n2 or fl1 != fl2:
                                 result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
                             elif clean:
                                 result[t1._subpath(fn)] = None

                         # files that exist in t2 only
                         for fn, n2 in pycompat.iteritems(files2):
                             if fn in files1:
                                 continue
                             fl2 = flags2.get(fn, b'')
                             result[t2._subpath(fn)] = ((None, b''), (n2, fl2))

                     pending = [(self, m2)]
                     while pending:
                         t1, t2 = pending.pop()
                         # compare() pushes the sub-manifest pairs onto pending
                         compare(t1, t2, pending)
                     return result
                 def unmodifiedsince(self, m2):
                     return not self._dirty and not m2._dirty and self._node == m2._node
                 def parse(self, text, readsubtree):
                     """Fill this tree from the manifest ``text``.

                     Entries flagged ``b't'`` become lazy subdirectories that will be
                     read through ``readsubtree``; any other entry is a file.
                     """
                     lazydirs = self._lazydirs
                     for path, node, flag in _parse(text):
                         if flag == b't':
                             # False below means "doesn't need to be copied" and can use the
                             # cached value from readsubtree directly.
                             lazydirs[path + b'/'] = (node, readsubtree, False)
                             continue
                         if b'/' in path:
                             # This is a flat manifest, so use __setitem__ and setflag rather
                             # than assigning directly to _files and _flags, so we can
                             # assign a path in a subdirectory, and to mark dirty (compared
                             # to nullid).
                             self[path] = node
                             if flag:
                                 self.setflag(path, flag)
                             continue
                         # Assigning to _files and _flags avoids marking as dirty,
                         # and should be a little faster.
                         self._files[path] = node
                         if flag:
                             self._flags[path] = flag
                 def text(self):
                     """Get the full data of this manifest as a bytestring."""
                     self._load()
                     # iterentries() covers the files of all subdirectories as well
                     return _text(self.iterentries())
                 def dirtext(self):
                     """Get the full data of this directory as a bytestring. Make sure that
                     any submanifests have been written first, so their nodeids are correct.
                     """
                     self._load()
                     getflags = self.flags
                     # subdirectories, loaded or lazy, are listed without the trailing
                     # slash and with the 't' flag
                     entries = [
                         (d[:-1], subm._node, b't')
                         for d, subm in pycompat.iteritems(self._dirs)
                     ]
                     entries.extend(
                         (f, node, getflags(f))
                         for f, node in pycompat.iteritems(self._files)
                     )
                     entries.extend(
                         (d[:-1], v[0], b't')
                         for d, v in pycompat.iteritems(self._lazydirs)
                     )
                     entries.sort()
                     return _text(entries)
                 def read(self, gettext, readsubtree):
                     def _load_for_read(s):
                         s.parse(gettext(), readsubtree)
                         s._dirty = False
                     self._loadfunc = _load_for_read
                 def writesubtrees(self, m1, m2, writesubtree, match):
                     """Call ``writesubtree(subm, node1, node2, match)`` for every
                     subdirectory of this tree that ``match`` does not rule out.

                     ``node1``/``node2`` are the nodes of the same directory in ``m1``
                     and ``m2``, swapped when the first one is nullid.
                     """
                     self._load()  # for consistency; should never have any effect here
                     m1._load()
                     m2._load()
                     emptytree = treemanifest()

                     def getnode(m, d):
                         # a lazy entry already knows its node, no need to load it
                         lazy = m._lazydirs.get(d)
                         if lazy:
                             return lazy[0]
                         return m._dirs.get(d, emptytree)._node

                     # let's skip investigating things that `match` says we do not need.
                     visit = match.visitchildrenset(self._dir[:-1])
                     visit = self._loadchildrensetlazy(visit)
                     if visit in (b'this', b'all'):
                         visit = None
                     for d, subm in pycompat.iteritems(self._dirs):
                         if visit and d[:-1] not in visit:
                             continue
                         node1 = getnode(m1, d)
                         node2 = getnode(m2, d)
                         if node1 == nullid:
                             node1, node2 = node2, node1
                         writesubtree(subm, node1, node2, match)
                 def walksubtrees(self, matcher=None):
                     """Returns an iterator of the subtrees of this manifest, including this
                     manifest itself.

                     If `matcher` is provided, it only returns subtrees that match.
                     """
                     here = self._dir[:-1]
                     if matcher and not matcher.visitdir(here):
                         return
                     if not matcher or matcher(here):
                         yield self

                     self._load()
                     # OPT: use visitchildrenset to avoid loading everything.
                     self._loadalllazy()
                     for d, subm in pycompat.iteritems(self._dirs):
                         for subtree in subm.walksubtrees(matcher=matcher):
                             yield subtree
             class manifestfulltextcache(util.lrucachedict):
                 """File-backed LRU cache for the manifest cache
                 File consists of entries, up to EOF:
                 - 20 bytes node, 4 bytes length, <length> manifest data
                 These are written in reverse cache order (oldest to newest).
                 """
                 _file = b'manifestfulltextcache'
                 def __init__(self, max):
                     """Create an empty cache; ``max`` is handed to the base class."""
                     super(manifestfulltextcache, self).__init__(max)
                     # whether there is something to write back in write()
                     self._dirty = False
                     # whether read() has already run
                     self._read = False
                     # callable used to open the cache file; read() and write() do
                     # nothing while it is None
                     self._opener = None
                 def read(self):
                     """Fill the cache from the cache file, at most once.

                     Does nothing when the file was already read or when no opener is
                     set. Entries are read until the end of the file or until the
                     first incomplete entry. A failure to open or read the file
                     (IOError) is ignored. Afterwards the cache is flagged as read
                     and as not dirty.
                     """
                     if self._read or self._opener is None:
                         return
                     try:
                         with self._opener(self._file) as fp:
                             # bypass our own __setitem__, which would call read() again
                             # and flag the cache dirty
                             setitem = super(manifestfulltextcache, self).__setitem__
                             # ignore trailing data, this is a cache, corruption is skipped
                             while True:
                                 # TODO do we need to do work here for sha1 portability?
                                 node = fp.read(20)
                                 if len(node) < 20:
                                     break
                                 try:
                                     size = struct.unpack(b'>L', fp.read(4))[0]
                                 except struct.error:
                                     # fewer than 4 length bytes left
                                     break
                                 value = bytearray(fp.read(size))
                                 if len(value) != size:
                                     break
                                 setitem(node, value)
                     except IOError:
                         # the file is allowed to be missing
                         pass
                     self._read = True
                     self._dirty = False
                 def write(self):
                     """Write the cache entries to the cache file.

                     Does nothing when the cache is not dirty or when no opener is
                     set. Each entry is written as the key, the value length packed
                     as a big-endian 4-byte integer, and the value. A failure to write
                     (IOError) is ignored.
                     """
                     if not self._dirty or self._opener is None:
                         return
                     # rotate backwards to the first used node
                     try:
                         with self._opener(
                             self._file, b'w', atomictemp=True, checkambig=True
                         ) as fp:
                             node = self._head.prev
                             while True:
                                 # only nodes whose key is still in the cache are written
                                 if node.key in self._cache:
                                     fp.write(node.key)
                                     fp.write(struct.pack(b'>L', len(node.value)))
                                     fp.write(node.value)
                                 if node is self._head:
                                     break
                                 node = node.prev
                     except IOError:
                         # We could not write the cache (eg: permission error)
                         # the content can be missing.
                         #
                         # We could try harder and see if we could recreate a wcache
                         # directory where we could write to.
                         #
                         # XXX the error passes silently, having some way to issue an
                         # error log `ui.log` would be nice.
                         pass
                 def __len__(self):
                     """Return the parent class' length, calling read() first if needed."""
                     parent = super(manifestfulltextcache, self)
                     if not self._read:
                         # lazily populate the cache before answering
                         self.read()
                     return parent.__len__()
                 def __contains__(self, k):
                     """Membership test for `k`, calling read() first if needed."""
                     parent = super(manifestfulltextcache, self)
                     if not self._read:
                         # lazily populate the cache before answering
                         self.read()
                     return parent.__contains__(k)
                 def __iter__(self):
                     """Return the parent class' iterator, calling read() first if needed."""
                     parent = super(manifestfulltextcache, self)
                     if not self._read:
                         # lazily populate the cache before iterating
                         self.read()
                     return parent.__iter__()
                 def __getitem__(self, k):
                     """Return the value stored for `k`, calling read() first if needed.

                     The cache is flagged dirty when the node found for `k` is not
                     the current head, since the lookup can then change the lru order.
                     """
                     parent = super(manifestfulltextcache, self)
                     if not self._read:
                         self.read()
                     # must be evaluated before the lookup below runs
                     reorders = self._cache.get(k) is not self._head
                     found = parent.__getitem__(k)
                     if reorders:
                         self._dirty = True
                     return found
                 def __setitem__(self, k, v):
                     """Store `v` under `k` and flag the cache as dirty.

                     read() is called first when the cache has not been read yet.
                     """
                     parent = super(manifestfulltextcache, self)
                     if not self._read:
                         self.read()
                     parent.__setitem__(k, v)
                     # only reached when the store above did not raise
                     self._dirty = True
                 def __delitem__(self, k):
                     """Remove `k` from the cache and flag the cache as dirty.

                     read() is called first when the cache has not been read yet.
                     """
                     parent = super(manifestfulltextcache, self)
                     if not self._read:
                         self.read()
                     parent.__delitem__(k)
                     # only reached when the removal above did not raise
                     self._dirty = True
                 def get(self, k, default=None):
                     """Return the parent class' get() result for `k`.

                     read() is called first when the cache has not been read yet;
                     `default` is forwarded by keyword.
                     """
                     parent = super(manifestfulltextcache, self)
                     if not self._read:
                         self.read()
                     return parent.get(k, default=default)
                 def clear(self, clear_persisted_data=False):
                     """Drop every in-memory entry.

                     When `clear_persisted_data` is true the cache is also flagged
                     dirty and write() is called right away. In both cases the cache
                     is marked as not read afterwards, so the next access calls
                     read() again.
                     """
                     parent = super(manifestfulltextcache, self)
                     parent.clear()
                     if clear_persisted_data:
                         # write() is a no-op unless the cache is dirty
                         self._dirty = True
                         self.write()
                     self._read = False
             # an upper bound of what we expect from compression
             # (real-life value seems to be "3")
             MAXCOMPRESSION = 3
             class FastdeltaUnavailable(Exception):
                 """Signal that the fastdelta path cannot be used for a manifest."""
             @interfaceutil.implementer(repository.imanifeststorage)
             class manifestrevlog(object):
                 """A revlog that stores manifest texts. This is responsible for caching the
                 full-text manifest contents.

                 Storage operations are forwarded to the ``revlog.revlog`` instance held
                 in ``self._revlog``.
                 """

                 def __init__(
                     self,
                     opener,
                     tree=b'',
                     dirlogcache=None,
                     indexfile=None,
                     treemanifest=False,
                 ):
                     """Constructs a new manifest revlog

                     `opener` - passed through to the underlying revlog; its optional
                     `options` mapping supplies the configuration read below.

                     `tree` - directory whose manifest is stored here (b'' for the root).

                     `dirlogcache` - mapping of directory to manifestrevlog, only used
                     when `tree` is set; the root revlog creates its own.

                     `indexfile` - used by extensions to have two manifests at once, like
                     when transitioning between flatmanifest and treemanifests.

                     `treemanifest` - used to indicate this is a tree manifest revlog. Opener
                     options can also be used to make this a tree manifest revlog. The opener
                     option takes precedence, so if it is set to True, we ignore whatever
                     value is passed in to the constructor.
                     """
                     # During normal operations, we expect to deal with not more than four
                     # revs at a time (such as during commit --amend). When rebasing large
                     # stacks of commits, the number can go up, hence the config knob below.
                     cachesize = 4
                     optiontreemanifest = False
                     persistentnodemap = False
                     opts = getattr(opener, 'options', None)
                     if opts is not None:
                         cachesize = opts.get(b'manifestcachesize', cachesize)
                         optiontreemanifest = opts.get(b'treemanifest', False)
                         # Read from the guarded `opts` rather than `opener.options`,
                         # so an opener without options does not raise AttributeError.
                         persistentnodemap = opts.get(b'persistent-nodemap', False)

                     self._treeondisk = optiontreemanifest or treemanifest

                     self._fulltextcache = manifestfulltextcache(cachesize)

                     if tree:
                         assert self._treeondisk, b'opts is %r' % opts

                     if indexfile is None:
                         indexfile = b'00manifest.i'
                         if tree:
                             indexfile = b"meta/" + tree + indexfile

                     self.tree = tree

                     # The dirlogcache is kept on the root manifest log
                     if tree:
                         self._dirlogcache = dirlogcache
                     else:
                         self._dirlogcache = {b'': self}

                     self._revlog = revlog.revlog(
                         opener,
                         indexfile,
                         # only root indexfile is cached
                         checkambig=not bool(tree),
                         mmaplargeindex=True,
                         upperboundcomp=MAXCOMPRESSION,
                         persistentnodemap=persistentnodemap,
                     )

                     self.index = self._revlog.index
                     self.version = self._revlog.version
                     self._generaldelta = self._revlog._generaldelta

                 def _setupmanifestcachehooks(self, repo):
                     """Persist the manifestfulltextcache on lock release"""
                     if not util.safehasattr(repo, b'_wlockref'):
                         return

                     self._fulltextcache._opener = repo.wcachevfs
                     if repo._currentlock(repo._wlockref) is None:
                         return

                     # Only weak references are captured by the callback below, so it
                     # keeps neither the repo nor this revlog alive.
                     reporef = weakref.ref(repo)
                     manifestrevlogref = weakref.ref(self)

                     def persistmanifestcache(success):
                         # Repo is in an unknown state, do not persist.
                         if not success:
                             return

                         repo = reporef()
                         self = manifestrevlogref()
                         if repo is None or self is None:
                             return
                         if repo.manifestlog.getstorage(b'') is not self:
                             # there's a different manifest in play now, abort
                             return
                         self._fulltextcache.write()

                     repo._afterlock(persistmanifestcache)

                 @property
                 def fulltextcache(self):
                     """The manifestfulltextcache instance owned by this revlog."""
                     return self._fulltextcache

                 def clearcaches(self, clear_persisted_data=False):
                     """Clear the revlog caches, the fulltext cache and the dirlog cache.

                     `clear_persisted_data` is forwarded to the fulltext cache's clear().
                     """
                     self._revlog.clearcaches()
                     self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)
                     self._dirlogcache = {self.tree: self}

                 def dirlog(self, d):
                     """Return the manifestrevlog for directory `d`, creating and caching
                     it in the dirlog cache on first use."""
                     if d:
                         assert self._treeondisk
                     if d not in self._dirlogcache:
                         mfrevlog = manifestrevlog(
                             self.opener, d, self._dirlogcache, treemanifest=self._treeondisk
                         )
                         self._dirlogcache[d] = mfrevlog
                     return self._dirlogcache[d]

                 def add(
                     self,
                     m,
                     transaction,
                     link,
                     p1,
                     p2,
                     added,
                     removed,
                     readtree=None,
                     match=None,
                 ):
                     """add some manifest entry in to the manifest log

                     input:

                       m:           the manifest dict we want to store
                       transaction: the open transaction
                       link:        passed through to the revlog's addrevision()
                       p1:          manifest-node of p1
                       p2:          manifest-node of p2
                       added:       file added/changed compared to parent
                       removed:     file removed compared to parent

                     tree manifest input:

                       readtree:    a function to read a subtree
                       match:       a filematcher for the subpart of the tree manifest

                     Returns the node of the stored manifest.
                     """
                     try:
                         if p1 not in self.fulltextcache:
                             raise FastdeltaUnavailable()
                         # If our first parent is in the manifest cache, we can
                         # compute a delta here using properties we know about the
                         # manifest up-front, which may save time later for the
                         # revlog layer.

                         _checkforbidden(added)
                         # combine the changed lists into one sorted iterator
                         work = heapq.merge(
                             [(x, False) for x in sorted(added)],
                             [(x, True) for x in sorted(removed)],
                         )

                         arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
                         cachedelta = self._revlog.rev(p1), deltatext
                         text = util.buffer(arraytext)
                         n = self._revlog.addrevision(
                             text, transaction, link, p1, p2, cachedelta
                         )
                     except FastdeltaUnavailable:
                         # The first parent manifest isn't already loaded or the
                         # manifest implementation doesn't support fastdelta, so
                         # we'll just encode a fulltext of the manifest and pass
                         # that through to the revlog layer, and let it handle the
                         # delta process.
                         if self._treeondisk:
                             assert readtree, b"readtree must be set for treemanifest writes"
                             assert match, b"match must be specified for treemanifest writes"
                             m1 = readtree(self.tree, p1)
                             m2 = readtree(self.tree, p2)
                             n = self._addtree(
                                 m, transaction, link, m1, m2, readtree, match=match
                             )
                             # tree manifests are not put in the fulltext cache
                             arraytext = None
                         else:
                             text = m.text()
                             n = self._revlog.addrevision(text, transaction, link, p1, p2)
                             arraytext = bytearray(text)

                     if arraytext is not None:
                         self.fulltextcache[n] = arraytext

                     return n

                 def _addtree(self, m, transaction, link, m1, m2, readtree, match):
                     """Write tree manifest `m` (and its subtrees) and return its node.

                     `m1` and `m2` are the parent manifests as returned by `readtree`.
                     """
                     # If the manifest is unchanged compared to one parent,
                     # don't write a new revision
                     if self.tree != b'' and (
                         m.unmodifiedsince(m1) or m.unmodifiedsince(m2)
                     ):
                         return m.node()

                     def writesubtree(subm, subp1, subp2, match):
                         sublog = self.dirlog(subm.dir())
                         sublog.add(
                             subm,
                             transaction,
                             link,
                             subp1,
                             subp2,
                             None,
                             None,
                             readtree=readtree,
                             match=match,
                         )

                     m.writesubtrees(m1, m2, writesubtree, match)
                     text = m.dirtext()
                     n = None
                     if self.tree != b'':
                         # Double-check whether contents are unchanged to one parent
                         if text == m1.dirtext():
                             n = m1.node()
                         elif text == m2.dirtext():
                             n = m2.node()

                     if not n:
                         n = self._revlog.addrevision(
                             text, transaction, link, m1.node(), m2.node()
                         )

                     # Save nodeid so parent manifest can calculate its nodeid
                     m.setnode(n)
                     return n

                 # The methods below forward to the wrapped revlog unchanged.

                 def __len__(self):
                     return len(self._revlog)

                 def __iter__(self):
                     return self._revlog.__iter__()

                 def rev(self, node):
                     return self._revlog.rev(node)

                 def node(self, rev):
                     return self._revlog.node(rev)

                 def lookup(self, value):
                     return self._revlog.lookup(value)

                 def parentrevs(self, rev):
                     return self._revlog.parentrevs(rev)

                 def parents(self, node):
                     return self._revlog.parents(node)

                 def linkrev(self, rev):
                     return self._revlog.linkrev(rev)

                 def checksize(self):
                     return self._revlog.checksize()

                 def revision(self, node, _df=None, raw=False):
                     return self._revlog.revision(node, _df=_df, raw=raw)

                 def rawdata(self, node, _df=None):
                     return self._revlog.rawdata(node, _df=_df)

                 def revdiff(self, rev1, rev2):
                     return self._revlog.revdiff(rev1, rev2)

                 def cmp(self, node, text):
                     return self._revlog.cmp(node, text)

                 def deltaparent(self, rev):
                     return self._revlog.deltaparent(rev)

                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                 ):
                     return self._revlog.emitrevisions(
                         nodes,
                         nodesorder=nodesorder,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         deltamode=deltamode,
                     )

                 def addgroup(
                     self,
                     deltas,
                     linkmapper,
                     transaction,
                     addrevisioncb=None,
                     duplicaterevisioncb=None,
                 ):
                     return self._revlog.addgroup(
                         deltas,
                         linkmapper,
                         transaction,
                         addrevisioncb=addrevisioncb,
                         duplicaterevisioncb=duplicaterevisioncb,
                     )

                 def rawsize(self, rev):
                     return self._revlog.rawsize(rev)

                 def getstrippoint(self, minlink):
                     return self._revlog.getstrippoint(minlink)

                 def strip(self, minlink, transaction):
                     return self._revlog.strip(minlink, transaction)

                 def files(self):
                     return self._revlog.files()

                 def clone(self, tr, destrevlog, **kwargs):
                     """Clone into `destrevlog`, which must be a manifestrevlog.

                     Raises error.ProgrammingError for any other destination type.
                     """
                     if not isinstance(destrevlog, manifestrevlog):
                         raise error.ProgrammingError(b'expected manifestrevlog to clone()')

                     return self._revlog.clone(tr, destrevlog._revlog, **kwargs)

                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     return self._revlog.storageinfo(
                         exclusivefiles=exclusivefiles,
                         sharedfiles=sharedfiles,
                         revisionscount=revisionscount,
                         trackedsize=trackedsize,
                         storedsize=storedsize,
                     )

                 @property
                 def indexfile(self):
                     """Index file of the wrapped revlog (readable and writable)."""
                     return self._revlog.indexfile

                 @indexfile.setter
                 def indexfile(self, value):
                     self._revlog.indexfile = value

                 @property
                 def opener(self):
                     """Opener of the wrapped revlog (readable and writable)."""
                     return self._revlog.opener

                 @opener.setter
                 def opener(self, value):
                     self._revlog.opener = value
             @interfaceutil.implementer(repository.imanifestlog)
             class manifestlog(object):
                 """A collection class representing the collection of manifest snapshots
                 referenced by commits in the repository.

                 In this situation, 'manifest' refers to the abstract concept of a snapshot
                 of the list of files in the given commit. Consumers of the output of this
                 class do not care about the implementation details of the actual manifests
                 they receive (i.e. tree or flat or lazily loaded, etc)."""

                 def __init__(self, opener, repo, rootstore, narrowmatch):
                     """Set up the per-directory context caches.

                     `opener` - only its optional `options` mapping is consulted here
                     (b'treemanifest' and b'manifestcachesize').
                     `repo` - handed to the root store to set up its cache hooks.
                     `rootstore` - storage object for the root manifest.
                     `narrowmatch` - matcher consulted by get() to detect excluded
                     directories.
                     """
                     usetreemanifest = False
                     cachesize = 4

                     opts = getattr(opener, 'options', None)
                     if opts is not None:
                         usetreemanifest = opts.get(b'treemanifest', usetreemanifest)
                         cachesize = opts.get(b'manifestcachesize', cachesize)

                     self._treemanifests = usetreemanifest

                     self._rootstore = rootstore
                     self._rootstore._setupmanifestcachehooks(repo)
                     self._narrowmatch = narrowmatch

                     # A cache of the manifestctx or treemanifestctx for each directory
                     self._dirmancache = {}
                     self._dirmancache[b''] = util.lrucachedict(cachesize)

                     self._cachesize = cachesize

                 def __getitem__(self, node):
                     """Retrieves the manifest instance for the given node. Throws a
                     LookupError if not found.
                     """
                     return self.get(b'', node)

                 def get(self, tree, node, verify=True):
                     """Retrieves the manifest instance for the given node. Throws a
                     LookupError if not found.

                     `verify` - if True an exception will be thrown if the node is not in
                                the revlog
                     """
                     if node in self._dirmancache.get(tree, ()):
                         return self._dirmancache[tree][node]

                     if not self._narrowmatch.always():
                         if not self._narrowmatch.visitdir(tree[:-1]):
                             return excludeddirmanifestctx(tree, node)
                     if tree:
                         if self._rootstore._treeondisk:
                             if verify:
                                 # Side-effect is LookupError is raised if node doesn't
                                 # exist.
                                 self.getstorage(tree).rev(node)

                             m = treemanifestctx(self, tree, node)
                         else:
                             raise error.Abort(
                                 _(
                                     b"cannot ask for manifest directory '%s' in a flat "
                                     b"manifest"
                                 )
                                 % tree
                             )
                     else:
                         if verify:
                             # Side-effect is LookupError is raised if node doesn't exist.
                             self._rootstore.rev(node)

                         if self._treemanifests:
                             m = treemanifestctx(self, b'', node)
                         else:
                             m = manifestctx(self, node)

                     if node != nullid:
                         mancache = self._dirmancache.get(tree)
                         # Test for None explicitly: a cache that exists but holds
                         # no entries yet can evaluate as false (lrucachedict appears
                         # to define __len__), and would then be needlessly replaced.
                         if mancache is None:
                             mancache = util.lrucachedict(self._cachesize)
                             self._dirmancache[tree] = mancache
                         mancache[node] = m
                     return m

                 def getstorage(self, tree):
                     """Return the storage object for directory `tree`."""
                     return self._rootstore.dirlog(tree)

                 def clearcaches(self, clear_persisted_data=False):
                     """Drop all cached contexts and clear the root store's caches."""
                     self._dirmancache.clear()
                     self._rootstore.clearcaches(clear_persisted_data=clear_persisted_data)

                 def rev(self, node):
                     """Return the root store's revision number for `node`."""
                     return self._rootstore.rev(node)

                 def update_caches(self, transaction):
                     """Forward to update_caches() of the root store's revlog."""
                     return self._rootstore._revlog.update_caches(transaction=transaction)
             @interfaceutil.implementer(repository.imanifestrevisionwritable)
             class memmanifestctx(object):
                 """Writable manifest context backed by an in-memory manifestdict."""

                 def __init__(self, manifestlog):
                     # starts out with an empty manifestdict
                     self._manifestdict = manifestdict()
                     self._manifestlog = manifestlog

                 def _storage(self):
                     """Return the root (b'') storage of the manifest log."""
                     return self._manifestlog.getstorage(b'')

                 def copy(self):
                     """Return a new memmanifestctx holding a copy of the manifest."""
                     duplicate = memmanifestctx(self._manifestlog)
                     duplicate._manifestdict = self.read().copy()
                     return duplicate

                 def read(self):
                     """Return the manifestdict held by this context."""
                     return self._manifestdict

                 def write(self, transaction, link, p1, p2, added, removed, match=None):
                     """Add the held manifest to the storage and return add()'s result."""
                     store = self._storage()
                     return store.add(
                         self._manifestdict,
                         transaction,
                         link,
                         p1,
                         p2,
                         added,
                         removed,
                         match=match,
                     )
             @interfaceutil.implementer(repository.imanifestrevisionstored)
             class manifestctx(object):
                 """A class representing a single revision of a manifest, including its
                 contents, its parent revs, and its linkrev.
                 """

                 def __init__(self, manifestlog, node):
                     self._node = node
                     self._manifestlog = manifestlog
                     # filled in lazily by read()
                     self._data = None

                     # TODO: We eventually want p1, p2, and linkrev exposed on this class,
                     # but let's add it later when something needs it and we can load it
                     # lazily.
                     # self.p1, self.p2 = store.parents(node)
                     # rev = store.rev(node)
                     # self.linkrev = store.linkrev(rev)

                 def _storage(self):
                     """Return the root (b'') storage of the manifest log."""
                     return self._manifestlog.getstorage(b'')

                 def node(self):
                     """Return the node this context was created for."""
                     return self._node

                 def copy(self):
                     """Return a memmanifestctx holding a copy of this manifest."""
                     duplicate = memmanifestctx(self._manifestlog)
                     duplicate._manifestdict = self.read().copy()
                     return duplicate

                 @propertycache
                 def parents(self):
                     return self._storage().parents(self._node)

                 def read(self):
                     """Return the manifestdict for this node, loading it on first use.

                     The text comes from the storage's fulltext cache when present;
                     otherwise it is read from the storage and added to that cache.
                     """
                     if self._data is not None:
                         return self._data

                     if self._node == nullid:
                         self._data = manifestdict()
                         return self._data

                     storage = self._storage()
                     if self._node in storage.fulltextcache:
                         text = pycompat.bytestr(storage.fulltextcache[self._node])
                     else:
                         text = storage.revision(self._node)
                         storage.fulltextcache[self._node] = bytearray(text)
                     self._data = manifestdict(text)
                     return self._data

                 def readfast(self, shallow=False):
                     """Calls either readdelta or read, based on which would be less work.
                     readdelta is called if the delta is against the p1, and therefore can be
                     read quickly.

                     If `shallow` is True, nothing changes since this is a flat manifest.
                     """
                     storage = self._storage()
                     rev = storage.rev(self._node)
                     base = storage.deltaparent(rev)
                     usedelta = base != nullrev and base in storage.parentrevs(rev)
                     reader = self.readdelta if usedelta else self.read
                     return reader()

                 def readdelta(self, shallow=False):
                     """Returns a manifest containing just the entries that are present
                     in this manifest, but not in its p1 manifest. This is efficient to read
                     if the revlog delta is already p1.

                     Changing the value of `shallow` has no effect on flat manifests.
                     """
                     storage = self._storage()
                     rev = storage.rev(self._node)
                     base = storage.deltaparent(rev)
                     delta = storage.revdiff(base, rev)
                     return manifestdict(mdiff.patchtext(delta))

                 def find(self, key):
                     """Forward to find() of the manifest returned by read()."""
                     return self.read().find(key)
             @interfaceutil.implementer(repository.imanifestrevisionwritable)
             class memtreemanifestctx(object):
                 """Writable manifest context backed by an in-memory treemanifest."""

                 def __init__(self, manifestlog, dir=b''):
                     # starts out with an empty treemanifest
                     self._treemanifest = treemanifest()
                     self._dir = dir
                     self._manifestlog = manifestlog

                 def _storage(self):
                     """Return the root (b'') storage of the manifest log."""
                     return self._manifestlog.getstorage(b'')

                 def copy(self):
                     """Return a new memtreemanifestctx holding a copy of the manifest."""
                     duplicate = memtreemanifestctx(self._manifestlog, dir=self._dir)
                     duplicate._treemanifest = self._treemanifest.copy()
                     return duplicate

                 def read(self):
                     """Return the treemanifest held by this context."""
                     return self._treemanifest

                 def write(self, transaction, link, p1, p2, added, removed, match=None):
                     """Add the held manifest to the storage and return add()'s result.

                     A `readtree` callback that reads subtrees through the manifest
                     log is handed to the storage.
                     """

                     def readtree(dir, node):
                         ctx = self._manifestlog.get(dir, node)
                         return ctx.read()

                     store = self._storage()
                     return store.add(
                         self._treemanifest,
                         transaction,
                         link,
                         p1,
                         p2,
                         added,
                         removed,
                         readtree=readtree,
                         match=match,
                     )
             @interfaceutil.implementer(repository.imanifestrevisionstored)
             class treemanifestctx(object):
                 def __init__(self, manifestlog, dir, node):
                     self._manifestlog = manifestlog
                     self._dir = dir
                     self._data = None
                     self._node = node
                     # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so that
                     # we can instantiate treemanifestctx objects for directories we don't
                     # have on disk.
                     # self.p1, self.p2 = store.parents(node)
                     # rev = store.rev(node)
                     # self.linkrev = store.linkrev(rev)
                 def _storage(self):
                     narrowmatch = self._manifestlog._narrowmatch
                     if not narrowmatch.always():
                         if not narrowmatch.visitdir(self._dir[:-1]):
                             return excludedmanifestrevlog(self._dir)
                     return self._manifestlog.getstorage(self._dir)
                 def read(self):
                     if self._data is None:
                         store = self._storage()
                         if self._node == nullid:
                             self._data = treemanifest()
                         # TODO accessing non-public API
                         elif store._treeondisk:
                             m = treemanifest(dir=self._dir)
                             def gettext():
                                 return store.revision(self._node)
                             def readsubtree(dir, subm):
                                 # Set verify to False since we need to be able to create
                                 # subtrees for trees that don't exist on disk.
                                 return self._manifestlog.get(dir, subm, verify=False).read()
                             m.read(gettext, readsubtree)
                             m.setnode(self._node)
                             self._data = m
                         else:
                             if self._node in store.fulltextcache:
                                 text = pycompat.bytestr(store.fulltextcache[self._node])
                             else:
                                 text = store.revision(self._node)
                                 arraytext = bytearray(text)
                                 store.fulltextcache[self._node] = arraytext
                             self._data = treemanifest(dir=self._dir, text=text)
                     return self._data
                 def node(self):
                     return self._node
                 def copy(self):
                     memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
                     memmf._treemanifest = self.read().copy()
                     return memmf
                 @propertycache
                 def parents(self):
                     return self._storage().parents(self._node)
                 def readdelta(self, shallow=False):
                     """Return only the entries that differ from the delta parent.
                     The result holds the entries of this manifest that are new or
                     changed compared with the revision its stored delta is based on;
                     entries that have no node on this side are left out. This is
                     meant to be cheap when that delta base is already p1.
                     With `shallow` set, only the delta for this directory is read and
                     subdirectory manifests are not read recursively. A subdirectory
                     entry is then reported as it appears in the manifest, i.e. among
                     the files and distinguished only by its 't' flag.
                     """
                     store = self._storage()
                     if shallow:
                         rev = store.rev(self._node)
                         base = store.deltaparent(rev)
                         patch = store.revdiff(base, rev)
                         return manifestdict(mdiff.patchtext(patch))
                     # Need to perform a slow delta: read both full manifests and
                     # keep what the newer side contributes.
                     base = store.deltaparent(store.rev(self._node))
                     basectx = self._manifestlog.get(self._dir, store.node(base))
                     old = basectx.read()
                     new = self.read()
                     delta = treemanifest(dir=self._dir)
                     changed = pycompat.iteritems(old.diff(new))
                     for path, ((oldnode, oldflag), (newnode, newflag)) in changed:
                         if not newnode:
                             # nothing on this side for the path, so skip it
                             continue
                         delta[path] = newnode
                         if newflag:
                             delta.setflag(path, newflag)
                     return delta
                 def readfast(self, shallow=False):
                     """Pick readdelta() or a full read, whichever should be less work.
                     readdelta() is used when the stored delta of this revision is
                     based on one of its parent revisions (and that base is not
                     nullrev), since the delta can then be read quickly.
                     Otherwise the full manifest is returned. With `shallow` set, that
                     is a manifestdict built from this revision's own text, holding
                     only the entries of this manifest and not any submanifests.
                     """
                     store = self._storage()
                     rev = store.rev(self._node)
                     base = store.deltaparent(rev)
                     if base != nullrev and base in store.parentrevs(rev):
                         return self.readdelta(shallow=shallow)
                     if not shallow:
                         return self.read()
                     return manifestdict(store.revision(self._node))
                 def find(self, key):
                     """Look `key` up in the manifest returned by read()."""
                     manifest = self.read()
                     return manifest.find(key)
             class excludeddir(treemanifest):
                 """Placeholder manifest for a directory outside the narrowspec.
                 On a narrowed repository that uses treemanifests, the revlogs of
                 some directories are left out of the clone. That saves a lot of
                 storage on clients, but internals still need some pseudo-manifest
                 in order to detect a merge conflict outside the narrowspec. An
                 instance of this class fills that role: the node of the directory
                 is known, its contents are not.
                 """
                 def __init__(self, dir, node):
                     super(excludeddir, self).__init__(dir)
                     self._node = node
                     # Register one empty-named entry flagged 't'. Iterators and such
                     # will include it, so it shows up as the directory itself
                     # (i.e. something like "dir/").
                     placeholder = b''
                     self._files[placeholder] = node
                     self._flags[placeholder] = b't'
                 def copy(self):
                     """Return this very object instead of a duplicate.
                     Manifests outside the narrowspec should never be modified, so
                     copying is avoided; this makes a noticeable difference when there
                     are very many directories outside the narrowspec. It also keeps
                     the result the same type as the original, which would not happen
                     with the super type's copy().
                     """
                     return self
             class excludeddirmanifestctx(treemanifestctx):
                 """context wrapper for excludeddir - see that docstring for rationale
                 Only the directory and the node are stored on the instance; the
                 constructor below sets up no manifestlog or storage reference.
                 """
                 def __init__(self, dir, node):
                     self._dir = dir
                     self._node = node
                 def read(self):
                     """Return a fresh excludeddir stand-in for this directory and node."""
                     return excludeddir(self._dir, self._node)
                 def readfast(self, shallow=False):
                     """Return the same stand-in as read(); `shallow` is not consulted."""
                     # special version of readfast since we don't have underlying storage
                     return self.read()
                 def write(self, *args):
                     """Always raise ProgrammingError, whatever arguments are given."""
                     raise error.ProgrammingError(
                         b'attempt to write manifest from excluded dir %s' % self._dir
                     )
             class excludedmanifestrevlog(manifestrevlog):
                 """Placeholder for treemanifest revlogs left out by narrowing.
                 With narrowing active on a treemanifest repository there are
                 references to directories that cannot be seen because their revlog
                 was skipped. This class conforms to the manifestrevlog interface
                 for those directories and proactively prevents writes outside the
                 narrowspec.
                 """
                 def __init__(self, dir):
                     # Only the directory is recorded; the methods below use it in
                     # their error messages.
                     self._dir = dir
                 def __len__(self):
                     """Always raise ProgrammingError for an excluded directory."""
                     msg = b'attempt to get length of excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)
                 def rev(self, node):
                     """Always raise ProgrammingError for an excluded directory."""
                     msg = b'attempt to get rev from excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)
                 def linkrev(self, node):
                     """Always raise ProgrammingError for an excluded directory."""
                     msg = b'attempt to get linkrev from excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)
                 def node(self, rev):
                     """Always raise ProgrammingError for an excluded directory."""
                     msg = b'attempt to get node from excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)
                 def add(self, *args, **kwargs):
                     """Accept any arguments and do nothing."""
                     # We should never write entries in dirlogs outside the narrow
                     # clone. The method nevertheless gets called from writesubtree()
                     # in _addtree(), so it has to be handled here. Possibly that code
                     # should avoid calling add() with a clean manifest (_dirty is
                     # always False in excludeddir instances).
                     return None