upstream/mercurial-mirror Commit - r45198:f0d88d20

1

# manifest.py - manifest revision class for mercurial

1

# manifest.py - manifest revision class for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import heapq

10

import heapq

11

import itertools

11

import itertools

12

import struct

12

import struct

13

import weakref

13

import weakref

14

15

from .i18n import _

15

from .i18n import _

16

from .node import (

16

from .node import (

17

bin,

17

bin,

18

hex,

18

hex,

19

nullid,

19

nullid,

20

nullrev,

20

nullrev,

21

)

21

)

22

from .pycompat import getattr

22

from .pycompat import getattr

23

from . import (

23

from . import (

24

encoding,

24

encoding,

25

error,

25

error,

26

match as matchmod,

26

match as matchmod,

27

mdiff,

27

mdiff,

28

pathutil,

28

pathutil,

29

policy,

29

policy,

30

pycompat,

30

pycompat,

31

revlog,

31

revlog,

32

util,

32

util,

33

)

33

)

34

from .interfaces import (

34

from .interfaces import (

35

repository,

35

repository,

36

util as interfaceutil,

36

util as interfaceutil,

37

)

37

)

38

39

parsers = policy.importmod('parsers')

39

parsers = policy.importmod('parsers')

40

propertycache = util.propertycache

40

propertycache = util.propertycache

41

42

# Allow tests to more easily test the alternate path in manifestdict.fastdelta()

42

# Allow tests to more easily test the alternate path in manifestdict.fastdelta()

43

FASTDELTA_TEXTDIFF_THRESHOLD = 1000

43

FASTDELTA_TEXTDIFF_THRESHOLD = 1000

44

45

46

def _parse(data):

46

def _parse(data):

47

# This method does a little bit of excessive-looking

47

# This method does a little bit of excessive-looking

48

# precondition checking. This is so that the behavior of this

48

# precondition checking. This is so that the behavior of this

49

# class exactly matches its C counterpart to try and help

49

# class exactly matches its C counterpart to try and help

50

# prevent surprise breakage for anyone that develops against

50

# prevent surprise breakage for anyone that develops against

51

# the pure version.

51

# the pure version.

52

if data and data[-1:] != b'\n':

52

if data and data[-1:] != b'\n':

53

raise ValueError(b'Manifest did not end in a newline.')

53

raise ValueError(b'Manifest did not end in a newline.')

54

prev = None

54

prev = None

55

for l in data.splitlines():

55

for l in data.splitlines():

56

if prev is not None and prev > l:

56

if prev is not None and prev > l:

57

raise ValueError(b'Manifest lines not in sorted order.')

57

raise ValueError(b'Manifest lines not in sorted order.')

58

prev = l

58

prev = l

59

f, n = l.split(b'\0')

59

f, n = l.split(b'\0')

60

nl = len(n)

60

nl = len(n)

61

if 64 < nl:

61

if 64 < nl:

62

# modern hash, full width

62

# modern hash, full width

63

yield f, bin(n[:64]), n[64:]

63

yield f, bin(n[:64]), n[64:]

64

if 40 < nl < 45:

64

if 40 < nl < 45:

65

# legacy hash, always sha1

65

# legacy hash, always sha1

66

yield f, bin(n[:40]), n[40:]

66

yield f, bin(n[:40]), n[40:]

67

else:

67

else:

68

yield f, bin(n), b''

68

yield f, bin(n), b''

69

70

71

def _text(it):
    """Serialize ``(filename, node, flags)`` triples into manifest text.

    Each triple becomes one ``<filename> NUL <hex node><flags>`` line ending
    in a newline. All filenames are handed to ``_checkforbidden()`` before
    the joined text is returned.
    """
    names, chunks = [], []
    for name, node, flag in it:
        names.append(name)
        # if this is changed to support newlines in filenames,
        # be sure to check the templates/ dir again (especially *-raw.tmpl)
        chunks.append(b"%s\0%s%s\n" % (name, hex(node), flag))

    _checkforbidden(names)
    return b''.join(chunks)

82

83

84

class lazymanifestiter(object):
    """Iterator over the filenames of a lazy manifest.

    ``lm`` only needs a ``_get(index)`` method returning ``(data, pos)`` and
    raising IndexError once ``index`` runs past the last entry.
    """

    def __init__(self, lm):
        self.lm = lm
        self.pos = 0

    def __iter__(self):
        return self

    def next(self):
        """Return the next filename, or raise StopIteration when exhausted."""
        index = self.pos
        try:
            data, pos = self.lm._get(index)
        except IndexError:
            raise StopIteration
        self.pos = index + 1
        if pos == -1:
            # ``data`` is an extradata tuple whose first item is the filename.
            return data[0]
        # Otherwise ``data`` is the manifest text and the filename runs from
        # ``pos`` up to the NUL separator.
        return data[pos : data.find(b'\x00', pos)]

    __next__ = next

105

106

107

class lazymanifestiterentries(object):
    """Iterator over the ``(filename, node, flags)`` entries of a lazy manifest.

    ``lm`` must provide ``_get(index)``, ``_getflags(data, index, zeropos)``
    and an ``extrainfo`` list indexed like its entries.
    """

    def __init__(self, lm):
        self.pos = 0
        self.lm = lm

    def __iter__(self):
        return self

    def next(self):
        """Return the next entry, or raise StopIteration when exhausted."""
        index = self.pos
        try:
            data, pos = self.lm._get(index)
        except IndexError:
            raise StopIteration
        if pos == -1:
            # Entry lives in extradata and already is a complete tuple.
            self.pos = index + 1
            return data
        zeropos = data.find(b'\x00', pos)
        # NOTE: this path always decodes exactly 40 hex digits after the NUL.
        hashval = unhexlify(data, self.lm.extrainfo[index], zeropos + 1, 40)
        flags = self.lm._getflags(data, index, zeropos)
        # Advance only after the entry was decoded successfully.
        self.pos = index + 1
        return (data[pos:zeropos], hashval, flags)

    __next__ = next

130

131

132

def unhexlify(data, extra, pos, length):
    """Decode ``length`` hex digits of ``data`` starting at ``pos``.

    When ``extra`` is non-zero, its low 8 bits are appended to the decoded
    value as one additional byte.

    Returns the decoded bytes.
    """
    s = bin(data[pos : pos + length])
    if extra:
        # Build the single byte through bytearray: chr() returns a text
        # string on Python 3 and cannot be concatenated onto bytes.
        s += bytes(bytearray((extra & 0xFF,)))
    return s

137

138

139

def _cmp(a, b):

139

def _cmp(a, b):

140

return (a > b) - (a < b)

140

return (a > b) - (a < b)

141

142

143

class _lazymanifest(object):

143

class _lazymanifest(object):

144

"""A pure python manifest backed by a byte string. It is supplimented with

144

"""A pure python manifest backed by a byte string. It is supplimented with

145

internal lists as it is modified, until it is compacted back to a pure byte

145

internal lists as it is modified, until it is compacted back to a pure byte

146

string.

146

string.

147

148

``data`` is the initial manifest data.

148

``data`` is the initial manifest data.

149

150

``positions`` is a list of offsets, one per manifest entry. Positive

150

``positions`` is a list of offsets, one per manifest entry. Positive

151

values are offsets into ``data``, negative values are offsets into the

151

values are offsets into ``data``, negative values are offsets into the

152

``extradata`` list. When an entry is removed, its entry is dropped from

152

``extradata`` list. When an entry is removed, its entry is dropped from

153

``positions``. The values are encoded such that when walking the list and

153

``positions``. The values are encoded such that when walking the list and

154

indexing into ``data`` or ``extradata`` as appropriate, the entries are

154

indexing into ``data`` or ``extradata`` as appropriate, the entries are

155

sorted by filename.

155

sorted by filename.

156

157

``extradata`` is a list of (key, hash, flags) for entries that were added or

157

``extradata`` is a list of (key, hash, flags) for entries that were added or

158

modified since the manifest was created or compacted.

158

modified since the manifest was created or compacted.

159

"""

159

"""

160

161

def __init__(

161

def __init__(

162

self,

162

self,

163

data,

163

data,

164

positions=None,

164

positions=None,

165

extrainfo=None,

165

extrainfo=None,

166

extradata=None,

166

extradata=None,

167

hasremovals=False,

167

hasremovals=False,

168

):

168

):

169

if positions is None:

169

if positions is None:

170

self.positions = self.findlines(data)

170

self.positions = self.findlines(data)

171

self.extrainfo = [0] * len(self.positions)

171

self.extrainfo = [0] * len(self.positions)

172

self.data = data

172

self.data = data

173

self.extradata = []

173

self.extradata = []

174

self.hasremovals = False

174

self.hasremovals = False

175

else:

175

else:

176

self.positions = positions[:]

176

self.positions = positions[:]

177

self.extrainfo = extrainfo[:]

177

self.extrainfo = extrainfo[:]

178

self.extradata = extradata[:]

178

self.extradata = extradata[:]

179

self.data = data

179

self.data = data

180

self.hasremovals = hasremovals

180

self.hasremovals = hasremovals

181

182

def findlines(self, data):

182

def findlines(self, data):

183

if not data:

183

if not data:

184

return []

184

return []

185

pos = data.find(b"\n")

185

pos = data.find(b"\n")

186

if pos == -1 or data[-1:] != b'\n':

186

if pos == -1 or data[-1:] != b'\n':

187

raise ValueError(b"Manifest did not end in a newline.")

187

raise ValueError(b"Manifest did not end in a newline.")

188

positions = [0]

188

positions = [0]

189

prev = data[: data.find(b'\x00')]

189

prev = data[: data.find(b'\x00')]

190

while pos < len(data) - 1 and pos != -1:

190

while pos < len(data) - 1 and pos != -1:

191

positions.append(pos + 1)

191

positions.append(pos + 1)

192

nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]

192

nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]

193

if nexts < prev:

193

if nexts < prev:

194

raise ValueError(b"Manifest lines not in sorted order.")

194

raise ValueError(b"Manifest lines not in sorted order.")

195

prev = nexts

195

prev = nexts

196

pos = data.find(b"\n", pos + 1)

196

pos = data.find(b"\n", pos + 1)

197

return positions

197

return positions

198

199

def _get(self, index):

199

def _get(self, index):

200

# get the position encoded in pos:

200

# get the position encoded in pos:

201

# positive number is an index in 'data'

201

# positive number is an index in 'data'

202

# negative number is in extrapieces

202

# negative number is in extrapieces

203

pos = self.positions[index]

203

pos = self.positions[index]

204

if pos >= 0:

204

if pos >= 0:

205

return self.data, pos

205

return self.data, pos

206

return self.extradata[-pos - 1], -1

206

return self.extradata[-pos - 1], -1

207

208

def _getkey(self, pos):

208

def _getkey(self, pos):

209

if pos >= 0:

209

if pos >= 0:

210

return self.data[pos : self.data.find(b'\x00', pos + 1)]

210

return self.data[pos : self.data.find(b'\x00', pos + 1)]

211

return self.extradata[-pos - 1][0]

211

return self.extradata[-pos - 1][0]

212

213

def bsearch(self, key):

213

def bsearch(self, key):

214

first = 0

214

first = 0

215

last = len(self.positions) - 1

215

last = len(self.positions) - 1

216

217

while first <= last:

217

while first <= last:

218

midpoint = (first + last) // 2

218

midpoint = (first + last) // 2

219

nextpos = self.positions[midpoint]

219

nextpos = self.positions[midpoint]

220

candidate = self._getkey(nextpos)

220

candidate = self._getkey(nextpos)

221

r = _cmp(key, candidate)

221

r = _cmp(key, candidate)

222

if r == 0:

222

if r == 0:

223

return midpoint

223

return midpoint

224

else:

224

else:

225

if r < 0:

225

if r < 0:

226

last = midpoint - 1

226

last = midpoint - 1

227

else:

227

else:

228

first = midpoint + 1

228

first = midpoint + 1

229

return -1

229

return -1

230

231

def bsearch2(self, key):

231

def bsearch2(self, key):

232

# same as the above, but will always return the position

232

# same as the above, but will always return the position

233

# done for performance reasons

233

# done for performance reasons

234

first = 0

234

first = 0

235

last = len(self.positions) - 1

235

last = len(self.positions) - 1

236

237

while first <= last:

237

while first <= last:

238

midpoint = (first + last) // 2

238

midpoint = (first + last) // 2

239

nextpos = self.positions[midpoint]

239

nextpos = self.positions[midpoint]

240

candidate = self._getkey(nextpos)

240

candidate = self._getkey(nextpos)

241

r = _cmp(key, candidate)

241

r = _cmp(key, candidate)

242

if r == 0:

242

if r == 0:

243

return (midpoint, True)

243

return (midpoint, True)

244

else:

244

else:

245

if r < 0:

245

if r < 0:

246

last = midpoint - 1

246

last = midpoint - 1

247

else:

247

else:

248

first = midpoint + 1

248

first = midpoint + 1

249

return (first, False)

249

return (first, False)

250

251

def __contains__(self, key):

251

def __contains__(self, key):

252

return self.bsearch(key) != -1

252

return self.bsearch(key) != -1

253

254

def _getflags(self, data, needle, pos):

254

def _getflags(self, data, needle, pos):

255

start = pos + 41

255

start = pos + 41

256

end = data.find(b"\n", start)

256

end = data.find(b"\n", start)

257

if end == -1:

257

if end == -1:

258

end = len(data) - 1

258

end = len(data) - 1

259

if start == end:

259

if start == end:

260

return b''

260

return b''

261

return self.data[start:end]

261

return self.data[start:end]

262

263

def __getitem__(self, key):

263

def __getitem__(self, key):

264

if not isinstance(key, bytes):

264

if not isinstance(key, bytes):

265

raise TypeError(b"getitem: manifest keys must be a bytes.")

265

raise TypeError(b"getitem: manifest keys must be a bytes.")

266

needle = self.bsearch(key)

266

needle = self.bsearch(key)

267

if needle == -1:

267

if needle == -1:

268

raise KeyError

268

raise KeyError

269

data, pos = self._get(needle)

269

data, pos = self._get(needle)

270

if pos == -1:

270

if pos == -1:

271

return (data[1], data[2])

271

return (data[1], data[2])

272

zeropos = data.find(b'\x00', pos)

272

zeropos = data.find(b'\x00', pos)

273

nlpos = data.find(b'\n', zeropos)

273

nlpos = data.find(b'\n', zeropos)

274

assert 0 <= needle <= len(self.positions)

274

assert 0 <= needle <= len(self.positions)

275

assert len(self.extrainfo) == len(self.positions)

275

assert len(self.extrainfo) == len(self.positions)

276

hlen = nlpos - zeropos - 1

276

hlen = nlpos - zeropos - 1

277

# Hashes sometimes have an extra byte tucked on the end, so

277

# Hashes sometimes have an extra byte tucked on the end, so

278

# detect that.

278

# detect that.

279

if hlen % 2:

279

if hlen % 2:

280

hlen -= 1

280

hlen -= 1

281

hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)

281

hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)

282

flags = self._getflags(data, needle, zeropos)

282

flags = self._getflags(data, needle, zeropos)

283

return (hashval, flags)

283

return (hashval, flags)

284

285

def __delitem__(self, key):

285

def __delitem__(self, key):

286

needle, found = self.bsearch2(key)

286

needle, found = self.bsearch2(key)

287

if not found:

287

if not found:

288

raise KeyError

288

raise KeyError

289

cur = self.positions[needle]

289

cur = self.positions[needle]

290

self.positions = self.positions[:needle] + self.positions[needle + 1 :]

290

self.positions = self.positions[:needle] + self.positions[needle + 1 :]

291

self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]

291

self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]

292

if cur >= 0:

292

if cur >= 0:

293

# This does NOT unsort the list as far as the search functions are

293

# This does NOT unsort the list as far as the search functions are

294

# concerned, as they only examine lines mapped by self.positions.

294

# concerned, as they only examine lines mapped by self.positions.

295

self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]

295

self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]

296

self.hasremovals = True

296

self.hasremovals = True

297

298

def __setitem__(self, key, value):

298

def __setitem__(self, key, value):

299

if not isinstance(key, bytes):

299

if not isinstance(key, bytes):

300

raise TypeError(b"setitem: manifest keys must be a byte string.")

300

raise TypeError(b"setitem: manifest keys must be a byte string.")

301

if not isinstance(value, tuple) or len(value) != 2:

301

if not isinstance(value, tuple) or len(value) != 2:

302

raise TypeError(

302

raise TypeError(

303

b"Manifest values must be a tuple of (node, flags)."

303

b"Manifest values must be a tuple of (node, flags)."

304

)

304

)

305

hashval = value[0]

305

hashval = value[0]

306

# hashes are either 20 or 32 bytes (sha1 or its replacement),

306

# hashes are either 20 or 32 bytes (sha1 or its replacement),

307

# and allow one extra byte taht won't be persisted to disk but

307

# and allow one extra byte taht won't be persisted to disk but

308

# is sometimes used in memory.

308

# is sometimes used in memory.

309

if not isinstance(hashval, bytes) or not (

309

if not isinstance(hashval, bytes) or not (

310

20 <= len(hashval) <= 22 or 32 <= len(hashval) <= 34

310

20 <= len(hashval) <= 22 or 32 <= len(hashval) <= 34

311

):

311

):

312

raise TypeError(b"node must be a 20-byte or 32-byte byte string")

312

raise TypeError(b"node must be a 20-byte or 32-byte byte string")

313

flags = value[1]

313

flags = value[1]

314

if len(hashval) == 22:

314

if len(hashval) == 22:

315

hashval = hashval[:-1]

315

hashval = hashval[:-1]

316

if not isinstance(flags, bytes) or len(flags) > 1:

316

if not isinstance(flags, bytes) or len(flags) > 1:

317

raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)

317

raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)

318

needle, found = self.bsearch2(key)

318

needle, found = self.bsearch2(key)

319

if found:

319

if found:

320

# put the item

320

# put the item

321

pos = self.positions[needle]

321

pos = self.positions[needle]

322

if pos < 0:

322

if pos < 0:

323

self.extradata[-pos - 1] = (key, hashval, value[1])

323

self.extradata[-pos - 1] = (key, hashval, value[1])

324

else:

324

else:

325

# just don't bother

325

# just don't bother

326

self.extradata.append((key, hashval, value[1]))

326

self.extradata.append((key, hashval, value[1]))

327

self.positions[needle] = -len(self.extradata)

327

self.positions[needle] = -len(self.extradata)

328

else:

328

else:

329

# not found, put it in with extra positions

329

# not found, put it in with extra positions

330

self.extradata.append((key, hashval, value[1]))

330

self.extradata.append((key, hashval, value[1]))

331

self.positions = (

331

self.positions = (

332

self.positions[:needle]

332

self.positions[:needle]

333

+ [-len(self.extradata)]

333

+ [-len(self.extradata)]

334

+ self.positions[needle:]

334

+ self.positions[needle:]

335

)

335

)

336

self.extrainfo = (

336

self.extrainfo = (

337

self.extrainfo[:needle] + [0] + self.extrainfo[needle:]

337

self.extrainfo[:needle] + [0] + self.extrainfo[needle:]

338

)

338

)

339

340

def copy(self):

340

def copy(self):

341

# XXX call _compact like in C?

341

# XXX call _compact like in C?

342

return _lazymanifest(

342

return _lazymanifest(

343

self.data,

343

self.data,

344

self.positions,

344

self.positions,

345

self.extrainfo,

345

self.extrainfo,

346

self.extradata,

346

self.extradata,

347

self.hasremovals,

347

self.hasremovals,

348

)

348

)

349

350

def _compact(self):

350

def _compact(self):

351

# hopefully not called TOO often

351

# hopefully not called TOO often

352

if len(self.extradata) == 0 and not self.hasremovals:

352

if len(self.extradata) == 0 and not self.hasremovals:

353

return

353

return

354

l = []

354

l = []

355

i = 0

355

i = 0

356

offset = 0

356

offset = 0

357

self.extrainfo = [0] * len(self.positions)

357

self.extrainfo = [0] * len(self.positions)

358

while i < len(self.positions):

358

while i < len(self.positions):

359

if self.positions[i] >= 0:

359

if self.positions[i] >= 0:

360

cur = self.positions[i]

360

cur = self.positions[i]

361

last_cut = cur

361

last_cut = cur

362

363

# Collect all contiguous entries in the buffer at the current

363

# Collect all contiguous entries in the buffer at the current

364

# offset, breaking out only for added/modified items held in

364

# offset, breaking out only for added/modified items held in

365

# extradata, or a deleted line prior to the next position.

365

# extradata, or a deleted line prior to the next position.

366

while True:

366

while True:

367

self.positions[i] = offset

367

self.positions[i] = offset

368

i += 1

368

i += 1

369

if i == len(self.positions) or self.positions[i] < 0:

369

if i == len(self.positions) or self.positions[i] < 0:

370

break

370

break

371

372

# A removed file has no positions[] entry, but does have an

372

# A removed file has no positions[] entry, but does have an

373

# overwritten first byte. Break out and find the end of the

373

# overwritten first byte. Break out and find the end of the

374

# current good entry/entries if there is a removed file

374

# current good entry/entries if there is a removed file

375

# before the next position.

375

# before the next position.

376

if (

376

if (

377

self.hasremovals

377

self.hasremovals

378

and self.data.find(b'\n\x00', cur, self.positions[i])

378

and self.data.find(b'\n\x00', cur, self.positions[i])

379

!= -1

379

!= -1

380

):

380

):

381

break

381

break

382

383

offset += self.positions[i] - cur

383

offset += self.positions[i] - cur

384

cur = self.positions[i]

384

cur = self.positions[i]

385

end_cut = self.data.find(b'\n', cur)

385

end_cut = self.data.find(b'\n', cur)

386

if end_cut != -1:

386

if end_cut != -1:

387

end_cut += 1

387

end_cut += 1

388

offset += end_cut - cur

388

offset += end_cut - cur

389

l.append(self.data[last_cut:end_cut])

389

l.append(self.data[last_cut:end_cut])

390

else:

390

else:

391

while i < len(self.positions) and self.positions[i] < 0:

391

while i < len(self.positions) and self.positions[i] < 0:

392

cur = self.positions[i]

392

cur = self.positions[i]

393

t = self.extradata[-cur - 1]

393

t = self.extradata[-cur - 1]

394

l.append(self._pack(t))

394

l.append(self._pack(t))

395

self.positions[i] = offset

395

self.positions[i] = offset

396

# Hashes are either 20 bytes (old sha1s) or 32

396

# Hashes are either 20 bytes (old sha1s) or 32

397

# bytes (new non-sha1).

397

# bytes (new non-sha1).

398

hlen = 20

398

hlen = 20

399

if len(t[1]) > 25:

399

if len(t[1]) > 25:

400

hlen = 32

400

hlen = 32

401

if len(t[1]) > hlen:

401

if len(t[1]) > hlen:

402

self.extrainfo[i] = ord(t[1][hlen + 1])

402

self.extrainfo[i] = ord(t[1][hlen + 1])

403

offset += len(l[-1])

403

offset += len(l[-1])

404

i += 1

404

i += 1

405

self.data = b''.join(l)

405

self.data = b''.join(l)

406

self.hasremovals = False

406

self.hasremovals = False

407

self.extradata = []

407

self.extradata = []

408

409

def _pack(self, d):

409

def _pack(self, d):

410

n = d[1]

410

n = d[1]

411

if len(n) == 21 or len(n) == 33:

411

if len(n) == 21 or len(n) == 33:

412

n = n[:-1]

412

n = n[:-1]

413

assert len(n) == 20 or len(n) == 32

413

assert len(n) == 20 or len(n) == 32

414

return d[0] + b'\x00' + hex(n) + d[2] + b'\n'

414

return d[0] + b'\x00' + hex(n) + d[2] + b'\n'

415

416

def text(self):

416

def text(self):

417

self._compact()

417

self._compact()

418

return self.data

418

return self.data

419

420

def diff(self, m2, clean=False):

420

def diff(self, m2, clean=False):

421

'''Finds changes between the current manifest and m2.'''

421

'''Finds changes between the current manifest and m2.'''

422

# XXX think whether efficiency matters here

422

# XXX think whether efficiency matters here

423

diff = {}

423

diff = {}

424

425

for fn, e1, flags in self.iterentries():

425

for fn, e1, flags in self.iterentries():

426

if fn not in m2:

426

if fn not in m2:

427

diff[fn] = (e1, flags), (None, b'')

427

diff[fn] = (e1, flags), (None, b'')

428

else:

428

else:

429

e2 = m2[fn]

429

e2 = m2[fn]

430

if (e1, flags) != e2:

430

if (e1, flags) != e2:

431

diff[fn] = (e1, flags), e2

431

diff[fn] = (e1, flags), e2

432

elif clean:

432

elif clean:

433

diff[fn] = None

433

diff[fn] = None

434

435

for fn, e2, flags in m2.iterentries():

435

for fn, e2, flags in m2.iterentries():

436

if fn not in self:

436

if fn not in self:

437

diff[fn] = (None, b''), (e2, flags)

437

diff[fn] = (None, b''), (e2, flags)

438

439

return diff

439

return diff

440

441

def iterentries(self):

441

def iterentries(self):

442

return lazymanifestiterentries(self)

442

return lazymanifestiterentries(self)

443

444

def iterkeys(self):

444

def iterkeys(self):

445

return lazymanifestiter(self)

445

return lazymanifestiter(self)

446

447

def __iter__(self):

447

def __iter__(self):

448

return lazymanifestiter(self)

448

return lazymanifestiter(self)

449

450

def __len__(self):

450

def __len__(self):

451

return len(self.positions)

451

return len(self.positions)

452

453

def filtercopy(self, filterfn):

453

def filtercopy(self, filterfn):

454

# XXX should be optimized

454

# XXX should be optimized

455

c = _lazymanifest(b'')

455

c = _lazymanifest(b'')

456

for f, n, fl in self.iterentries():

456

for f, n, fl in self.iterentries():

457

if filterfn(f):

457

if filterfn(f):

458

c[f] = n, fl

458

c[f] = n, fl

459

return c

459

return c

460

461

462

# Replace the pure-Python class with ``parsers.lazymanifest`` when the loaded
# ``parsers`` module has that attribute; otherwise keep the class above.
try:
    _clazymanifest = parsers.lazymanifest
except AttributeError:
    pass
else:
    _lazymanifest = _clazymanifest
    del _clazymanifest

466

467

468

@interfaceutil.implementer(repository.imanifestdict)

468

@interfaceutil.implementer(repository.imanifestdict)

469

class manifestdict(object):

469

class manifestdict(object):

470

def __init__(self, data=b''):

470

def __init__(self, data=b''):

471

self._lm = _lazymanifest(data)

471

self._lm = _lazymanifest(data)

472

473

def __getitem__(self, key):

473

def __getitem__(self, key):

474

return self._lm[key][0]

474

return self._lm[key][0]

475

476

def find(self, key):

476

def find(self, key):

477

return self._lm[key]

477

return self._lm[key]

478

479

def __len__(self):

479

def __len__(self):

480

return len(self._lm)

480

return len(self._lm)

481

482

def __nonzero__(self):

482

def __nonzero__(self):

483

# nonzero is covered by the __len__ function, but implementing it here

483

# nonzero is covered by the __len__ function, but implementing it here

484

# makes it easier for extensions to override.

484

# makes it easier for extensions to override.

485

return len(self._lm) != 0

485

return len(self._lm) != 0

486

487

__bool__ = __nonzero__

487

__bool__ = __nonzero__

488

489

def __setitem__(self, key, node):

489

def __setitem__(self, key, node):

490

self._lm[key] = node, self.flags(key)

490

self._lm[key] = node, self.flags(key)

491

492

def __contains__(self, key):

492

def __contains__(self, key):

493

if key is None:

493

if key is None:

494

return False

494

return False

495

return key in self._lm

495

return key in self._lm

496

497

def __delitem__(self, key):

497

def __delitem__(self, key):

498

del self._lm[key]

498

del self._lm[key]

499

500

def __iter__(self):

500

def __iter__(self):

501

return self._lm.__iter__()

501

return self._lm.__iter__()

502

503

def iterkeys(self):

503

def iterkeys(self):

504

return self._lm.iterkeys()

504

return self._lm.iterkeys()

505

506

def keys(self):

506

def keys(self):

507

return list(self.iterkeys())

507

return list(self.iterkeys())

508

509

def filesnotin(self, m2, match=None):

509

def filesnotin(self, m2, match=None):

510

'''Set of files in this manifest that are not in the other'''

510

'''Set of files in this manifest that are not in the other'''

511

if match is not None:

511

if match is not None:

512

match = matchmod.badmatch(match, lambda path, msg: None)

512

match = matchmod.badmatch(match, lambda path, msg: None)

513

sm2 = set(m2.walk(match))

513

sm2 = set(m2.walk(match))

514

return {f for f in self.walk(match) if f not in sm2}

514

return {f for f in self.walk(match) if f not in sm2}

515

return {f for f in self if f not in m2}

515

return {f for f in self if f not in m2}

516

517

@propertycache

517

@propertycache

518

def _dirs(self):

518

def _dirs(self):

519

return pathutil.dirs(self)

519

return pathutil.dirs(self)

520

521

def dirs(self):

521

def dirs(self):

522

return self._dirs

522

return self._dirs

523

524

def hasdir(self, dir):

524

def hasdir(self, dir):

525

return dir in self._dirs

525

return dir in self._dirs

526

527

def _filesfastpath(self, match):

527

def _filesfastpath(self, match):

528

'''Checks whether we can correctly and quickly iterate over matcher

528

'''Checks whether we can correctly and quickly iterate over matcher

529

files instead of over manifest files.'''

529

files instead of over manifest files.'''

530

files = match.files()

530

files = match.files()

531

return len(files) < 100 and (

531

return len(files) < 100 and (

532

match.isexact()

532

match.isexact()

533

or (match.prefix() and all(fn in self for fn in files))

533

or (match.prefix() and all(fn in self for fn in files))

534

)

534

)

535

536

def walk(self, match):

536

def walk(self, match):

537

'''Generates matching file names.

537

'''Generates matching file names.

538

539

Equivalent to manifest.matches(match).iterkeys(), but without creating

539

Equivalent to manifest.matches(match).iterkeys(), but without creating

540

an entirely new manifest.

540

an entirely new manifest.

541

542

It also reports nonexistent files by marking them bad with match.bad().

542

It also reports nonexistent files by marking them bad with match.bad().

543

'''

543

'''

544

if match.always():

544

if match.always():

545

for f in iter(self):

545

for f in iter(self):

546

yield f

546

yield f

547

return

547

return

548

549

fset = set(match.files())

549

fset = set(match.files())

550

551

# avoid the entire walk if we're only looking for specific files

551

# avoid the entire walk if we're only looking for specific files

552

if self._filesfastpath(match):

552

if self._filesfastpath(match):

553

for fn in sorted(fset):

553

for fn in sorted(fset):

554

if fn in self:

554

if fn in self:

555

yield fn

555

yield fn

556

return

556

return

557

558

for fn in self:

558

for fn in self:

559

if fn in fset:

559

if fn in fset:

560

# specified pattern is the exact name

560

# specified pattern is the exact name

561

fset.remove(fn)

561

fset.remove(fn)

562

if match(fn):

562

if match(fn):

563

yield fn

563

yield fn

564

565

# for dirstate.walk, files=[''] means "walk the whole tree".

565

# for dirstate.walk, files=[''] means "walk the whole tree".

566

# follow that here, too

566

# follow that here, too

567

fset.discard(b'')

567

fset.discard(b'')

568

569

for fn in sorted(fset):

569

for fn in sorted(fset):

570

if not self.hasdir(fn):

570

if not self.hasdir(fn):

571

match.bad(fn, None)

571

match.bad(fn, None)

572

573

def _matches(self, match):
    '''generate a new manifest filtered by the match argument'''
    if match.always():
        return self.copy()

    if not self._filesfastpath(match):
        # general case: let the underlying store filter itself
        filtered = manifestdict()
        filtered._lm = self._lm.filtercopy(match)
        return filtered

    # fast path: copy only the explicitly listed files that exist here
    filtered = manifestdict()
    source = self._lm
    for name in match.files():
        if name in source:
            filtered._lm[name] = source[name]
    return filtered

589

590

def diff(self, m2, match=None, clean=False):
    '''Finds changes between the current manifest and m2.

    Args:
      m2: the manifest to which this manifest should be compared.
      match: optional matcher; when given, both manifests are narrowed
        with _matches(match) before being compared.
      clean: if true, include files unchanged between these manifests
        with a None value in the returned dictionary.

    The result is returned as a dict with filename as key and
    values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
    nodeid in the current/other manifest and fl1/fl2 is the flag
    in the current/other manifest. Where the file does not exist,
    the nodeid will be None and the flags will be the empty
    string.
    '''
    if not match:
        return self._lm.diff(m2._lm, clean)

    narrowed1 = self._matches(match)
    narrowed2 = m2._matches(match)
    return narrowed1.diff(narrowed2, clean=clean)

610

611

def setflag(self, key, flag):
    """Replace the flag stored for key, keeping its current node."""
    node = self[key]
    self._lm[key] = (node, flag)

613

614

def get(self, key, default=None):
    """Return the node stored for key, or default when key is absent."""
    try:
        entry = self._lm[key]
    except KeyError:
        return default
    return entry[0]

619

620

def flags(self, key):
    """Return the flag stored for key, or b'' when key is absent."""
    try:
        entry = self._lm[key]
    except KeyError:
        return b''
    return entry[1]

625

626

def copy(self):
    """Return a new manifestdict backed by a copy of this one's store."""
    duplicate = manifestdict()
    duplicate._lm = self._lm.copy()
    return duplicate

630

631

def items(self):
    """Return an iterable over the first two fields of every entry."""
    entries = self._lm.iterentries()
    return (entry[:2] for entry in entries)

633

634

def iteritems(self):
    """Return an iterable over the first two fields of every entry."""
    entries = self._lm.iterentries()
    return (entry[:2] for entry in entries)

636

637

def iterentries(self):
    """Return the underlying store's entry iterator unchanged."""
    store = self._lm
    return store.iterentries()

639

640

def text(self):
    """Return the manifest text as produced by the underlying store."""
    # most likely uses native version
    store = self._lm
    return store.text()

643

644

def fastdelta(self, base, changes):
    """Given a base manifest text as a bytearray and a list of changes
    relative to that text, compute a delta that can be used by revlog.

    ``changes`` is iterated as ``(filename, todelete)`` pairs. For a pair
    whose ``todelete`` is false, the new line is built from this
    manifest's own entry for that filename.

    Returns a ``(arraytext, deltatext)`` tuple: the new manifest text as
    a bytearray and the delta against ``base``.

    Raises AssertionError when a file marked for deletion is not present
    in ``base``.
    """
    delta = []
    # [dstart, dend) is the range of base covered by the delta chunk
    # currently being accumulated; dline holds its replacement lines
    dstart = None
    dend = None
    dline = [b""]
    start = 0
    # zero copy representation of base as a buffer
    addbuf = util.buffer(base)

    changes = list(changes)
    if len(changes) < FASTDELTA_TEXTDIFF_THRESHOLD:
        # start with a readonly loop that finds the offset of
        # each line and creates the deltas
        for f, todelete in changes:
            # start is either the offset of f's line or its insertion
            # point; each search resumes from the previous start
            start, end = _msearch(addbuf, f, start)
            if not todelete:
                h, fl = self._lm[f]
                l = b"%s\0%s%s\n" % (f, hex(h), fl)
            else:
                if start == end:
                    # item we want to delete was not found, error out
                    raise AssertionError(
                        _(b"failed to remove %s from manifest") % f
                    )
                l = b""
            if dstart is not None and dstart <= start and dend >= start:
                # this change starts inside (or right at the end of) the
                # pending chunk: extend that chunk instead of opening a
                # new one
                if dend < end:
                    dend = end
                if l:
                    dline.append(l)
            else:
                # flush the pending chunk, if any, and start a new one
                if dstart is not None:
                    delta.append([dstart, dend, b"".join(dline)])
                dstart = start
                dend = end
                dline = [l]

        # flush the last pending chunk
        if dstart is not None:
            delta.append([dstart, dend, b"".join(dline)])
        # apply the delta to the base, and get a delta for addrevision
        deltatext, arraytext = _addlistdelta(base, delta)
    else:
        # For large changes, it's much cheaper to just build the text and
        # diff it.
        arraytext = bytearray(self.text())
        deltatext = mdiff.textdiff(
            util.buffer(base), util.buffer(arraytext)
        )

    return arraytext, deltatext

698

699

700

def _msearch(m, s, lo=0, hi=None):
    '''return a tuple (start, end) that says where to find s within m.

    If the string is found m[start:end] are the line containing
    that string.  If start == end the string was not found and
    they indicate the proper sorted insertion point.

    m should be a buffer, a memoryview or a byte string.
    s is a byte string'''
    if not s:
        return (lo, lo)

    size = len(m)

    def scan(pos, stop):
        # move forward until the one-byte delimiter `stop` (or the end
        # of m) is reached
        while pos < size and m[pos : pos + 1] != stop:
            pos += 1
        return pos

    if not hi:
        hi = size
    while lo < hi:
        linestart = (lo + hi) // 2
        # back up to the first byte of the line holding the midpoint
        while linestart > 0 and m[linestart - 1 : linestart] != b'\n':
            linestart -= 1
        nameend = scan(linestart, b'\0')
        if bytes(m[linestart:nameend]) >= s:
            # this translates to the bisect hi = mid
            hi = linestart
        else:
            # we know that after the null there are 40 bytes of sha1
            # this translates to the bisect lo = mid + 1
            lo = scan(nameend + 40, b'\n') + 1

    nameend = scan(lo, b'\0')
    if s != m[lo:nameend]:
        return (lo, lo)
    # we know that after the null there are 40 bytes of sha1
    lineend = scan(nameend + 40, b'\n')
    return (lo, lineend + 1)

741

742

743

def _checkforbidden(l):
    """Check filenames for illegal characters.

    Raises error.StorageError for the first name in ``l`` that contains
    a newline or a carriage return.
    """
    for name in l:
        if not (b'\n' in name or b'\r' in name):
            continue
        raise error.StorageError(
            _(b"'\\n' and '\\r' disallowed in filenames: %r")
            % pycompat.bytestr(name)
        )

751

752

753

# apply the changes collected during the bisect loop to our addlist

753

# apply the changes collected during the bisect loop to our addlist

754

# return a delta suitable for addrevision

754

# return a delta suitable for addrevision

755

def _addlistdelta(addlist, x):
    """Apply the (start, end, content) chunks in ``x`` to ``addlist``.

    Returns ``(deltatext, newaddlist)``: the chunks serialized with a
    ``>lll`` header each, and a new bytearray with the chunks applied.
    """
    # for large addlist arrays, building a new array is cheaper
    # than repeatedly modifying the existing one
    rebuilt = bytearray()
    cursor = 0
    for first, last, payload in x:
        # keep the untouched bytes before this chunk, then its replacement
        rebuilt += addlist[cursor:first]
        if payload:
            rebuilt += bytearray(payload)
        cursor = last
    rebuilt += addlist[cursor:]

    pieces = []
    for first, last, payload in x:
        header = struct.pack(b">lll", first, last, len(payload))
        pieces.append(header + payload)
    return b"".join(pieces), rebuilt

775

776

777

def _splittopdir(f):
    """Split ``f`` at its first b'/'.

    Returns (topdir including the trailing slash, remainder), or
    (b'', f) when ``f`` contains no slash.
    """
    head, slash, tail = f.partition(b'/')
    if not slash:
        return b'', f
    return head + b'/', tail

783

784

785

def _noop(s):
    """Do nothing; placeholder for the treemanifest load/copy callbacks."""
    return None

786

787

788

@interfaceutil.implementer(repository.imanifestdict)

788

@interfaceutil.implementer(repository.imanifestdict)

789

class treemanifest(object):

789

class treemanifest(object):

790

def __init__(self, dir=b'', text=b''):
    """Create a tree manifest for ``dir``, optionally parsed from ``text``.

    ``text`` must be a flat manifest: the subtree reader handed to
    parse() raises AssertionError if it is ever called.
    """
    self._dir = dir
    self._node = nullid
    self._dirty = False
    self._loadfunc = _noop
    self._copyfunc = _noop
    self._lazydirs = {}
    self._dirs = {}
    # Using _lazymanifest here is a little slower than plain old dicts
    self._files = {}
    self._flags = {}
    if not text:
        return

    def rejectsubtree(subdir, subm):
        raise AssertionError(
            b'treemanifest constructor only accepts flat manifests'
        )

    self.parse(text, rejectsubtree)
    self._dirty = True  # Mark flat manifest dirty after parsing

810

811

def _subpath(self, path):
    """Return ``path`` prefixed with this tree's directory."""
    prefix = self._dir
    return prefix + path

813

814

def _loadalllazy(self):
    """Read every pending lazy subdirectory into _dirs and clear _lazydirs."""
    loaded = self._dirs
    for name, entry in pycompat.iteritems(self._lazydirs):
        subpath, subnode, reader, needcopy = entry
        subtree = reader(subpath, subnode)
        loaded[name] = subtree.copy() if needcopy else subtree
    self._lazydirs = {}

824

825

def _loadlazy(self, d):
    """Read lazy subdirectory ``d`` into _dirs, if it is still pending."""
    entry = self._lazydirs.get(d)
    if not entry:
        return
    subpath, subnode, reader, needcopy = entry
    subtree = reader(subpath, subnode)
    self._dirs[d] = subtree.copy() if needcopy else subtree
    del self._lazydirs[d]

834

835

def _loadchildrensetlazy(self, visit):
    """Load the lazy subdirectories selected by ``visit``.

    A false ``visit`` loads nothing; b'all' or b'this' loads everything.
    Both cases return None. Otherwise each element of ``visit`` is loaded
    (with b'/' appended) and ``visit`` itself is returned.
    """
    if not visit:
        return None
    if visit in (b'all', b'this'):
        self._loadalllazy()
        return None

    load = self._loadlazy
    for child in visit:
        load(child + b'/')
    return visit

846

847

def _loaddifflazy(self, t1, t2):
    """load items in t1 and t2 if they're needed for diffing.

    The criteria currently is:
    - if it's not present in _lazydirs in either t1 or t2, load it in the
      other (it may already be loaded or it may not exist, doesn't matter)
    - if it's present in _lazydirs in both, compare the nodeid; if it
      differs, load it in both
    """
    lazy1 = t1._lazydirs
    lazy2 = t2._lazydirs

    pending = []
    for name, entry1 in pycompat.iteritems(lazy1):
        entry2 = lazy2.get(name)
        # index 1 of a lazy entry is its node id
        if entry2 and entry2[1] == entry1[1]:
            continue
        pending.append(name)
    pending.extend(
        name for name, _unused in pycompat.iteritems(lazy2) if name not in lazy1
    )

    for name in pending:
        t1._loadlazy(name)
        t2._loadlazy(name)

868

869

def __len__(self):
    """Count the files in this tree and, recursively, in all subtrees."""
    self._load()
    ownfiles = len(self._files)
    self._loadalllazy()
    return ownfiles + sum(sub.__len__() for sub in self._dirs.values())

876

877

def __nonzero__(self):
    """Return True when the tree is not empty (per _isempty())."""
    # Faster than "__len() != 0" since it avoids loading sub-manifests
    empty = self._isempty()
    return not empty

__bool__ = __nonzero__

882

883

def _isempty(self):
    """Return True when this tree and all of its subtrees hold no files."""
    self._load()  # for consistency; already loaded by all callers
    # See if we can skip loading everything.
    if self._files:
        return False
    if any(not sub._isempty() for sub in self._dirs.values()):
        return False
    # nothing found among the loaded parts; the lazy ones must be read
    self._loadalllazy()
    return all(sub._isempty() for sub in self._dirs.values())

892

893

@encoding.strmethod
def __repr__(self):
    """Describe the tree: directory, node, load state, dirtiness, id."""
    loaded = bool(self._loadfunc is _noop)
    fields = (
        self._dir,
        hex(self._node),
        loaded,
        self._dirty,
        id(self),
    )
    template = b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
    return template % fields

905

906

def dir(self):
    '''Return the directory this tree manifest represents.

    The value includes a trailing '/'; it is the empty string for the
    repo root directory.'''
    path = self._dir
    return path

910

911

def node(self):
    '''Return the node of this instance.

    It is nullid for unsaved instances and should be updated when the
    instance is read or written from a revlog. Asking for the node of a
    dirty instance trips an assertion.
    '''
    assert not self._dirty
    current = self._node
    return current

917

918

def setnode(self, node):
    """Record ``node`` as this tree's node and mark the tree clean."""
    self._dirty = False
    self._node = node

921

922

def iterentries(self):
    """Yield (path, node, flags) for every file, in sorted name order.

    Subdirectories are expanded in place by delegating to their own
    iterentries().
    """
    self._load()
    self._loadalllazy()
    children = list(self._dirs.items())
    children.extend(self._files.items())
    children.sort()
    for name, value in children:
        if name not in self._files:
            # a subdirectory: value is the subtree
            for entry in value.iterentries():
                yield entry
            continue
        yield self._subpath(name), value, self._flags.get(name, b'')

933

934

def items(self):
    """Yield (path, node) for every file, in sorted name order.

    Subdirectories are expanded in place by iterating their own items.
    """
    self._load()
    self._loadalllazy()
    children = list(self._dirs.items())
    children.extend(self._files.items())
    children.sort()
    for name, value in children:
        if name not in self._files:
            # a subdirectory: value is the subtree
            for path, node in pycompat.iteritems(value):
                yield path, node
            continue
        yield self._subpath(name), value

iteritems = items

947

948

def iterkeys(self):
    """Yield the path of every file, in sorted name order.

    Subdirectories are expanded in place by iterating the subtree.
    """
    self._load()
    self._loadalllazy()
    names = list(self._dirs)
    names.extend(self._files)
    names.sort()
    for name in names:
        if name not in self._files:
            for path in self._dirs[name]:
                yield path
            continue
        yield self._subpath(name)

957

958

def keys(self):
    """Return the output of iterkeys() as a list."""
    paths = self.iterkeys()
    return list(paths)

960

961

def __iter__(self):
    """Iterate over file paths; same as iterkeys()."""
    paths = self.iterkeys()
    return paths

963

964

def __contains__(self, f):
    """Return True when file path ``f`` is in this tree; None never is."""
    if f is None:
        return False
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        return f in self._files

    self._loadlazy(topdir)
    if topdir not in self._dirs:
        return False
    return self._dirs[topdir].__contains__(rest)

978

979

def get(self, f, default=None):
    """Return the node stored for path ``f``, or ``default`` if absent."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        return self._files.get(f, default)

    self._loadlazy(topdir)
    if topdir not in self._dirs:
        return default
    return self._dirs[topdir].get(rest, default)

990

991

def __getitem__(self, f):
    """Return the node stored for path ``f``; lookups use plain indexing."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        return self._files[f]

    self._loadlazy(topdir)
    subtree = self._dirs[topdir]
    return subtree.__getitem__(rest)

1000

1001

def flags(self, f):
    """Return the flags stored for path ``f``, or b'' when there are none."""
    self._load()
    topdir, rest = _splittopdir(f)
    if topdir:
        self._loadlazy(topdir)
        if topdir not in self._dirs:
            return b''
        return self._dirs[topdir].flags(rest)

    # a name that is a key of the directory maps gets empty flags
    if f in self._lazydirs or f in self._dirs:
        return b''
    return self._flags.get(f, b'')

1014

1015

def find(self, f):
    """Return (node, flags) for path ``f``; lookups use plain indexing."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        return self._files[f], self._flags.get(f, b'')

    self._loadlazy(topdir)
    subtree = self._dirs[topdir]
    return subtree.find(rest)

1024

1025

def __delitem__(self, f):
    """Remove path ``f`` (and its flags) and mark this tree dirty."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        del self._files[f]
        self._flags.pop(f, None)
    else:
        self._loadlazy(topdir)
        self._dirs[topdir].__delitem__(rest)
        # If the directory is now empty, remove it
        if self._dirs[topdir]._isempty():
            del self._dirs[topdir]
    self._dirty = True

1040

1041

def __setitem__(self, f, n):
    """Store node ``n`` for path ``f`` and mark this tree dirty.

    Missing intermediate subtrees are created on the way down.
    """
    assert n is not None
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        # manifest nodes are either 20 bytes or 32 bytes,
        # depending on the hash in use. An extra byte is
        # occasionally used by hg, but won't ever be
        # persisted. Trim to 21 or 33 bytes as appropriate.
        if len(n) < 25:
            keep = 21
        else:
            keep = 33
        self._files[f] = n[:keep]  # to match manifestdict's behavior
    else:
        self._loadlazy(topdir)
        if topdir not in self._dirs:
            self._dirs[topdir] = treemanifest(self._subpath(topdir))
        self._dirs[topdir].__setitem__(rest, n)
    self._dirty = True

1058

1059

def _load(self):
    """Run the pending load callback, or else the pending copy callback.

    The callback slot is reset to _noop before the callback is invoked,
    and at most one of the two callbacks runs per call.
    """
    pending = self._loadfunc
    if pending is not _noop:
        self._loadfunc = _noop
        pending(self)
        return

    pending = self._copyfunc
    if pending is not _noop:
        self._copyfunc = _noop
        pending(self)

1066

1067

def setflag(self, f, flags):
    """Set the flags (symlink, executable) for path f."""
    self._load()
    topdir, rest = _splittopdir(f)
    if not topdir:
        self._flags[f] = flags
    else:
        self._loadlazy(topdir)
        if topdir not in self._dirs:
            self._dirs[topdir] = treemanifest(self._subpath(topdir))
        self._dirs[topdir].setflag(rest, flags)
    self._dirty = True

1079

1080

def copy(self):
    """Return a copy of this tree.

    If this tree still has a load callback pending, the content copy is
    deferred by storing it as the new tree's copy callback.
    """
    duplicate = treemanifest(self._dir)
    duplicate._node = self._node
    duplicate._dirty = self._dirty

    if self._copyfunc is not _noop:
        # this tree is itself a not-yet-materialized copy: share the
        # pending callback
        duplicate._copyfunc = self._copyfunc
        return duplicate

    def _copyfunc(s):
        self._load()
        # lazy entries are carried over with their copy marker set
        s._lazydirs = {
            name: (path, node, reader, True)
            for name, (path, node, reader, _docopy) in pycompat.iteritems(
                self._lazydirs
            )
        }
        targetdirs = s._dirs
        for name, subtree in pycompat.iteritems(self._dirs):
            targetdirs[name] = subtree.copy()
        s._files = dict.copy(self._files)
        s._flags = dict.copy(self._flags)

    if self._loadfunc is _noop:
        _copyfunc(duplicate)
    else:
        duplicate._copyfunc = _copyfunc
    return duplicate

1105

1106

def filesnotin(self, m2, match=None):
    '''Set of files in this manifest that are not in the other'''
    if match and not match.always():
        narrowed1 = self._matches(match)
        narrowed2 = m2._matches(match)
        return narrowed1.filesnotin(narrowed2)

    missing = set()

    def _collect(t1, t2):
        # two clean trees with the same node are skipped without loading
        if t1._node == t2._node and not t1._dirty and not t2._dirty:
            return
        t1._load()
        t2._load()
        self._loaddifflazy(t1, t2)
        for name, sub1 in pycompat.iteritems(t1._dirs):
            if name not in t2._dirs:
                # the whole directory is absent on the other side
                missing.update(sub1.iterkeys())
            else:
                _collect(sub1, t2._dirs[name])

        missing.update(
            t1._subpath(fn) for fn in t1._files if fn not in t2._files
        )

    _collect(self, m2)
    return missing

1134

1135

@propertycache
def _alldirs(self):
    """Directory collection built by pathutil.dirs() from this manifest."""
    alldirs = pathutil.dirs(self)
    return alldirs

1138

1139

def dirs(self):
    """Return the _alldirs value for this manifest."""
    alldirs = self._alldirs
    return alldirs

1141

1142

def hasdir(self, dir):
    """Return True when ``dir`` names a directory known to this tree."""
    self._load()
    topdir, subdir = _splittopdir(dir)
    if not topdir:
        # single path component: it is a directory if it is a key of
        # either the loaded or the still-lazy directory map
        dirslash = dir + b'/'
        return dirslash in self._dirs or dirslash in self._lazydirs

    self._loadlazy(topdir)
    if topdir not in self._dirs:
        return False
    return self._dirs[topdir].hasdir(subdir)

1152

1153

def walk(self, match):
    '''Generates matching file names.

    It also reports nonexistent files by marking them bad with match.bad().
    '''
    if match.always():
        for f in iter(self):
            yield f
        return

    fset = set(match.files())

    for fn in self._walk(match):
        if fn in fset:
            # specified pattern is the exact name
            fset.remove(fn)
        yield fn

    # for dirstate.walk, files=[''] means "walk the whole tree".
    # follow that here, too
    fset.discard(b'')

    # Whatever is left was named explicitly but never yielded; it is only
    # acceptable if it names a directory.
    for fn in sorted(fset):
        if not self.hasdir(fn):
            match.bad(fn, None)

1178

1179

def _walk(self, match):
    '''Recursively generates matching file names for walk().'''
    visit = match.visitchildrenset(self._dir[:-1])
    if not visit:
        return

    # yield this dir's files and walk its submanifests
    self._load()
    visit = self._loadchildrensetlazy(visit)
    # Files and subdirectories are interleaved in sorted order.
    for p in sorted(list(self._dirs) + list(self._files)):
        if p in self._files:
            fullp = self._subpath(p)
            if match(fullp):
                yield fullp
        else:
            # p is a directory key with a trailing slash; ``visit`` holds
            # names without it.
            if not visit or p[:-1] in visit:
                for f in self._dirs[p]._walk(match):
                    yield f

1197

1198

def _matches(self, match):
    '''recursively generate a new manifest filtered by the match argument.

    An "always" matcher short-circuits to a plain copy.
    '''
    if match.always():
        return self.copy()
    return self._matches_inner(match)

1204

1205

def _matches_inner(self, match):
    """Build the filtered treemanifest for this directory.

    Returns a copy of ``self`` when the matcher accepts everything here,
    otherwise a new ``treemanifest`` for the same directory holding only
    the matching files and the non-empty filtered submanifests.  A
    non-empty result is marked dirty.
    """
    if match.always():
        return self.copy()

    visit = match.visitchildrenset(self._dir[:-1])
    if visit == b'all':
        return self.copy()
    ret = treemanifest(self._dir)
    if not visit:
        return ret

    self._load()
    for fn in self._files:
        # While visitchildrenset *usually* lists only subdirs, this is
        # actually up to the matcher and may have some files in the set().
        # If visit == 'this', we should obviously look at the files in this
        # directory; if visit is a set, and fn is in it, we should inspect
        # fn (but no need to inspect things not in the set).
        if visit != b'this' and fn not in visit:
            continue
        fullp = self._subpath(fn)
        # visitchildrenset isn't perfect, we still need to call the regular
        # matcher code to further filter results.
        if not match(fullp):
            continue
        ret._files[fn] = self._files[fn]
        if fn in self._flags:
            ret._flags[fn] = self._flags[fn]

    visit = self._loadchildrensetlazy(visit)
    for dir, subm in pycompat.iteritems(self._dirs):
        if visit and dir[:-1] not in visit:
            continue
        m = subm._matches_inner(match)
        if not m._isempty():
            ret._dirs[dir] = m

    if not ret._isempty():
        ret._dirty = True
    return ret

1245

1246

def fastdelta(self, base, changes):
    """Always raise FastdeltaUnavailable; no fast delta is computed here."""
    raise FastdeltaUnavailable()

1248

1249

def diff(self, m2, match=None, clean=False):
    '''Finds changes between the current manifest and m2.

    Args:
      m2: the manifest to which this manifest should be compared.
      match: optional matcher; when given and not an "always" matcher,
        both manifests are narrowed with it before being compared.
      clean: if true, include files unchanged between these manifests
        with a None value in the returned dictionary.

    The result is returned as a dict with filename as key and
    values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
    nodeid in the current/other manifest and fl1/fl2 is the flag
    in the current/other manifest. Where the file does not exist,
    the nodeid will be None and the flags will be the empty
    string.
    '''
    if match and not match.always():
        m1 = self._matches(match)
        m2 = m2._matches(match)
        return m1.diff(m2, clean=clean)
    result = {}
    emptytree = treemanifest()

    def _iterativediff(t1, t2, stack):
        """compares two tree manifests and append new tree-manifests which
        needs to be compared to stack"""
        if t1._node == t2._node and not t1._dirty and not t2._dirty:
            return
        t1._load()
        t2._load()
        self._loaddifflazy(t1, t2)

        # Subdirectories are queued rather than recursed into; a directory
        # missing on one side is compared against an empty tree.
        for d, m1 in pycompat.iteritems(t1._dirs):
            m2 = t2._dirs.get(d, emptytree)
            stack.append((m1, m2))

        for d, m2 in pycompat.iteritems(t2._dirs):
            if d not in t1._dirs:
                stack.append((emptytree, m2))

        for fn, n1 in pycompat.iteritems(t1._files):
            fl1 = t1._flags.get(fn, b'')
            n2 = t2._files.get(fn, None)
            fl2 = t2._flags.get(fn, b'')
            if n1 != n2 or fl1 != fl2:
                result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
            elif clean:
                result[t1._subpath(fn)] = None

        for fn, n2 in pycompat.iteritems(t2._files):
            if fn not in t1._files:
                fl2 = t2._flags.get(fn, b'')
                result[t2._subpath(fn)] = ((None, b''), (n2, fl2))

    stackls = []
    _iterativediff(self, m2, stackls)
    while stackls:
        t1, t2 = stackls.pop()
        # stackls is populated in the function call
        _iterativediff(t1, t2, stackls)
    return result

1309

1310

def unmodifiedsince(self, m2):
    """Return True if neither manifest is dirty and both have the same node."""
    return not self._dirty and not m2._dirty and self._node == m2._node

1312

1313

def parse(self, text, readsubtree):
    """Populate this manifest from ``text``.

    Each ``(f, n, fl)`` entry produced by ``_parse(text)`` is stored as a
    lazy subdirectory (flag ``b't'``), as a nested path (name contains a
    slash), or directly as a file of this directory.
    """
    selflazy = self._lazydirs
    subpath = self._subpath
    for f, n, fl in _parse(text):
        if fl == b't':
            f = f + b'/'
            # False below means "doesn't need to be copied" and can use the
            # cached value from readsubtree directly.
            selflazy[f] = (subpath(f), n, readsubtree, False)
        elif b'/' in f:
            # This is a flat manifest, so use __setitem__ and setflag rather
            # than assigning directly to _files and _flags, so we can
            # assign a path in a subdirectory, and to mark dirty (compared
            # to nullid).
            self[f] = n
            if fl:
                self.setflag(f, fl)
        else:
            # Assigning to _files and _flags avoids marking as dirty,
            # and should be a little faster.
            self._files[f] = n
            if fl:
                self._flags[f] = fl

1336

1337

def text(self):
    """Get the full data of this manifest as a bytestring."""
    self._load()
    return _text(self.iterentries())

1341

1342

def dirtext(self):
    """Get the full data of this directory as a bytestring. Make sure that
    any submanifests have been written first, so their nodeids are correct.
    """
    self._load()
    flags = self.flags
    # Subdirectories, loaded or still lazy, are emitted without their
    # trailing slash and with the b't' flag.
    lazydirs = [
        (d[:-1], v[1], b't') for d, v in pycompat.iteritems(self._lazydirs)
    ]
    dirs = [(d[:-1], self._dirs[d]._node, b't') for d in self._dirs]
    files = [(f, self._files[f], flags(f)) for f in self._files]
    return _text(sorted(dirs + files + lazydirs))

1354

1355

def read(self, gettext, readsubtree):
    """Install a deferred loader instead of parsing immediately.

    The stored ``_loadfunc`` calls ``gettext()`` and parses the result
    only when invoked, then clears the dirty flag of the manifest it was
    given.
    """

    def _load_for_read(s):
        s.parse(gettext(), readsubtree)
        s._dirty = False

    self._loadfunc = _load_for_read

1361

1362

def writesubtrees(self, m1, m2, writesubtree, match):
    """Call ``writesubtree`` for each subdirectory that ``match`` may visit.

    ``m1`` and ``m2`` supply the nodes passed along for each directory
    (see ``getnode``).  ``writesubtree`` is invoked as
    ``writesubtree(subm, subp1, subp2, match)``.
    """
    self._load()  # for consistency; should never have any effect here
    m1._load()
    m2._load()
    emptytree = treemanifest()

    def getnode(m, d):
        # Prefer the node recorded for a lazy directory so it does not
        # have to be loaded.
        ld = m._lazydirs.get(d)
        if ld:
            return ld[1]
        return m._dirs.get(d, emptytree)._node

    # let's skip investigating things that `match` says we do not need.
    visit = match.visitchildrenset(self._dir[:-1])
    visit = self._loadchildrensetlazy(visit)
    if visit == b'this' or visit == b'all':
        visit = None
    for d, subm in pycompat.iteritems(self._dirs):
        if visit and d[:-1] not in visit:
            continue
        subp1 = getnode(m1, d)
        subp2 = getnode(m2, d)
        if subp1 == nullid:
            # Keep a null node out of the first position when possible.
            subp1, subp2 = subp2, subp1
        writesubtree(subm, subp1, subp2, match)

1387

1388

def walksubtrees(self, matcher=None):
    """Returns an iterator of the subtrees of this manifest, including this
    manifest itself.

    If `matcher` is provided, it only returns subtrees that match.
    """
    if matcher and not matcher.visitdir(self._dir[:-1]):
        return
    if not matcher or matcher(self._dir[:-1]):
        yield self

    self._load()
    # OPT: use visitchildrenset to avoid loading everything.
    self._loadalllazy()
    for d, subm in pycompat.iteritems(self._dirs):
        for subtree in subm.walksubtrees(matcher=matcher):
            yield subtree

1405

1406

1407

class manifestfulltextcache(util.lrucachedict):
    """File-backed LRU cache for the manifest cache

    File consists of entries, up to EOF:

    - 20 bytes node, 4 bytes length, <length> manifest data

    These are written in reverse cache order (oldest to newest).

    The file is read lazily on first access through the mapping methods
    and only when an opener has been assigned to ``_opener``.
    """

    _file = b'manifestfulltextcache'

    def __init__(self, max):
        super(manifestfulltextcache, self).__init__(max)
        # True when the in-memory state differs from what was last
        # read or written.
        self._dirty = False
        # True once the on-disk file has been consulted.
        self._read = False
        # Callable used to open ``_file``; None disables persistence.
        self._opener = None

    def read(self):
        """Load entries from the cache file, if not already done."""
        if self._read or self._opener is None:
            return

        try:
            with self._opener(self._file) as fp:
                # Use the parent's __setitem__ so loading does not go
                # through this class's override.
                setitem = super(manifestfulltextcache, self).__setitem__
                # ignore trailing data, this is a cache, corruption is skipped
                while True:
                    # TODO do we need to do work here for sha1 portability?
                    node = fp.read(20)
                    if len(node) < 20:
                        break
                    try:
                        size = struct.unpack(b'>L', fp.read(4))[0]
                    except struct.error:
                        break
                    value = bytearray(fp.read(size))
                    if len(value) != size:
                        break
                    setitem(node, value)
        except IOError:
            # the file is allowed to be missing
            pass

        self._read = True
        self._dirty = False

    def write(self):
        """Write the cache to its file if dirty and an opener is set."""
        if not self._dirty or self._opener is None:
            return
        # rotate backwards to the first used node
        with self._opener(
            self._file, b'w', atomictemp=True, checkambig=True
        ) as fp:
            node = self._head.prev
            while True:
                if node.key in self._cache:
                    fp.write(node.key)
                    fp.write(struct.pack(b'>L', len(node.value)))
                    fp.write(node.value)
                if node is self._head:
                    break
                node = node.prev

    def __len__(self):
        if not self._read:
            self.read()
        return super(manifestfulltextcache, self).__len__()

    def __contains__(self, k):
        if not self._read:
            self.read()
        return super(manifestfulltextcache, self).__contains__(k)

    def __iter__(self):
        if not self._read:
            self.read()
        return super(manifestfulltextcache, self).__iter__()

    def __getitem__(self, k):
        if not self._read:
            self.read()
        # the cache lru order can change on read
        setdirty = self._cache.get(k) is not self._head
        value = super(manifestfulltextcache, self).__getitem__(k)
        if setdirty:
            self._dirty = True
        return value

    def __setitem__(self, k, v):
        if not self._read:
            self.read()
        super(manifestfulltextcache, self).__setitem__(k, v)
        self._dirty = True

    def __delitem__(self, k):
        if not self._read:
            self.read()
        super(manifestfulltextcache, self).__delitem__(k)
        self._dirty = True

    def get(self, k, default=None):
        if not self._read:
            self.read()
        return super(manifestfulltextcache, self).get(k, default=default)

    def clear(self, clear_persisted_data=False):
        """Empty the in-memory cache.

        With ``clear_persisted_data`` the now-empty cache is also written
        out.  In both cases the next access re-reads the file.
        """
        super(manifestfulltextcache, self).clear()
        if clear_persisted_data:
            self._dirty = True
            self.write()
        self._read = False

1518

1519

1520

# an upper bound of what we expect from compression
# (real live value seems to be "3")
MAXCOMPRESSION = 3

1523

1524

1525

class FastdeltaUnavailable(Exception):
    """Exception raised when fastdelta isn't usable on a manifest."""

1527

1528

1529

@interfaceutil.implementer(repository.imanifeststorage)

1530

@interfaceutil.implementer(repository.imanifeststorage)

1530

class manifestrevlog(object):

1531

class manifestrevlog(object):

1531

'''A revlog that stores manifest texts. This is responsible for caching the

1532

'''A revlog that stores manifest texts. This is responsible for caching the

1532

full-text manifest contents.

1533

full-text manifest contents.

1533

'''

1534

'''

1534

1535

def __init__(
    self,
    opener,
    tree=b'',
    dirlogcache=None,
    indexfile=None,
    treemanifest=False,
):
    """Constructs a new manifest revlog

    `indexfile` - used by extensions to have two manifests at once, like
    when transitioning between flat manifests and treemanifests.

    `treemanifest` - used to indicate this is a tree manifest revlog. Opener
    options can also be used to make this a tree manifest revlog. The opener
    option takes precedence, so if it is set to True, we ignore whatever
    value is passed in to the constructor.
    """
    # During normal operations, we expect to deal with not more than four
    # revs at a time (such as during commit --amend). When rebasing large
    # stacks of commits, the number can go up, hence the config knob below.
    cachesize = 4
    optiontreemanifest = False
    opts = getattr(opener, 'options', None)
    if opts is not None:
        cachesize = opts.get(b'manifestcachesize', cachesize)
        optiontreemanifest = opts.get(b'treemanifest', False)

    self._treeondisk = optiontreemanifest or treemanifest

    self._fulltextcache = manifestfulltextcache(cachesize)

    if tree:
        assert self._treeondisk, b'opts is %r' % opts

    if indexfile is None:
        indexfile = b'00manifest.i'
        if tree:
            indexfile = b"meta/" + tree + indexfile

    self.tree = tree

    # The dirlogcache is kept on the root manifest log
    if tree:
        self._dirlogcache = dirlogcache
    else:
        self._dirlogcache = {b'': self}

    self._revlog = revlog.revlog(
        opener,
        indexfile,
        # only root indexfile is cached
        checkambig=not bool(tree),
        mmaplargeindex=True,
        upperboundcomp=MAXCOMPRESSION,
    )

    # Expose selected attributes of the underlying revlog directly.
    self.index = self._revlog.index
    self.version = self._revlog.version
    self._generaldelta = self._revlog._generaldelta

1595

1596

def _setupmanifestcachehooks(self, repo):
    """Persist the manifestfulltextcache on lock release"""
    if not util.safehasattr(repo, b'_wlockref'):
        return

    self._fulltextcache._opener = repo.wcachevfs
    if repo._currentlock(repo._wlockref) is None:
        return

    # The callback only holds weak references, so registering it does not
    # keep the repo or this revlog alive.
    reporef = weakref.ref(repo)
    manifestrevlogref = weakref.ref(self)

    def persistmanifestcache(success):
        # Repo is in an unknown state, do not persist.
        if not success:
            return

        repo = reporef()
        self = manifestrevlogref()
        if repo is None or self is None:
            return
        if repo.manifestlog.getstorage(b'') is not self:
            # there's a different manifest in play now, abort
            return
        self._fulltextcache.write()

    repo._afterlock(persistmanifestcache)

1623

1624

@property
def fulltextcache(self):
    """The ``manifestfulltextcache`` instance created in ``__init__``."""
    return self._fulltextcache

1627

1628

def clearcaches(self, clear_persisted_data=False):
    """Clear the revlog caches, the fulltext cache and the dirlog cache.

    ``clear_persisted_data`` is forwarded to the fulltext cache's
    ``clear()``.  The dirlog cache is reset to contain only this revlog,
    keyed by its own tree.
    """
    self._revlog.clearcaches()
    self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)
    self._dirlogcache = {self.tree: self}

1632

1633

def dirlog(self, d):
    """Return the manifestrevlog for directory ``d``, creating it on demand.

    Instances are memoized in ``_dirlogcache``.  A non-empty ``d`` is only
    valid when this revlog stores tree manifests.
    """
    if d:
        assert self._treeondisk
    if d not in self._dirlogcache:
        mfrevlog = manifestrevlog(
            self.opener, d, self._dirlogcache, treemanifest=self._treeondisk
        )
        self._dirlogcache[d] = mfrevlog
    return self._dirlogcache[d]

1642

1643

def add(
    self,
    m,
    transaction,
    link,
    p1,
    p2,
    added,
    removed,
    readtree=None,
    match=None,
):
    """Store manifest ``m`` as a new revision and return its node.

    ``transaction``, ``link``, ``p1`` and ``p2`` are forwarded to the
    underlying revlog's ``addrevision``. ``added`` and ``removed`` are
    the changed entries used to build a fast delta against ``p1``
    (presumably file paths -- confirm against callers). ``readtree``
    and ``match`` are required when tree manifests are stored on disk
    and the fast path is unavailable.
    """
    try:
        if p1 not in self.fulltextcache:
            raise FastdeltaUnavailable()
        # If our first parent is in the manifest cache, we can
        # compute a delta here using properties we know about the
        # manifest up-front, which may save time later for the
        # revlog layer.

        _checkforbidden(added)
        # combine the changed lists into one sorted iterator
        work = heapq.merge(
            [(x, False) for x in sorted(added)],
            [(x, True) for x in sorted(removed)],
        )

        arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
        cachedelta = self._revlog.rev(p1), deltatext
        text = util.buffer(arraytext)
        n = self._revlog.addrevision(
            text, transaction, link, p1, p2, cachedelta
        )
    except FastdeltaUnavailable:
        # The first parent manifest isn't already loaded or the
        # manifest implementation doesn't support fastdelta, so
        # we'll just encode a fulltext of the manifest and pass
        # that through to the revlog layer, and let it handle the
        # delta process.
        if self._treeondisk:
            assert readtree, b"readtree must be set for treemanifest writes"
            assert match, b"match must be specified for treemanifest writes"
            m1 = readtree(self.tree, p1)
            m2 = readtree(self.tree, p2)
            n = self._addtree(
                m, transaction, link, m1, m2, readtree, match=match
            )
            # Tree writes produce no flat full text to cache.
            arraytext = None
        else:
            text = m.text()
            n = self._revlog.addrevision(text, transaction, link, p1, p2)
            arraytext = bytearray(text)

    if arraytext is not None:
        self.fulltextcache[n] = arraytext

    return n

1700

1701

def _addtree(self, m, transaction, link, m1, m2, readtree, match):
    """Write tree manifest ``m`` (with parents ``m1``/``m2``); return node.

    Subtrees are written first through ``m.writesubtrees``. For a
    non-root tree, an existing parent node is reused when ``m`` is
    unmodified since a parent or its directory text equals a parent's;
    otherwise a new revision is added to the underlying revlog. The
    resulting node is recorded on ``m`` via ``setnode``, except on the
    early "unmodified" return.
    """
    # If the manifest is unchanged compared to one parent,
    # don't write a new revision
    if self.tree != b'' and (
        m.unmodifiedsince(m1) or m.unmodifiedsince(m2)
    ):
        return m.node()

    def writesubtree(subm, subp1, subp2, match):
        sublog = self.dirlog(subm.dir())
        sublog.add(
            subm,
            transaction,
            link,
            subp1,
            subp2,
            None,
            None,
            readtree=readtree,
            match=match,
        )

    m.writesubtrees(m1, m2, writesubtree, match)
    text = m.dirtext()
    n = None
    if self.tree != b'':
        # Double-check whether contents are unchanged to one parent
        if text == m1.dirtext():
            n = m1.node()
        elif text == m2.dirtext():
            n = m2.node()

    if not n:
        n = self._revlog.addrevision(
            text, transaction, link, m1.node(), m2.node()
        )

    # Save nodeid so parent manifest can calculate its nodeid
    m.setnode(n)
    return n

1741

1742

def __len__(self):
    """Return the length of the underlying revlog."""
    return len(self._revlog)

1744

1745

def __iter__(self):
    """Return the iterator produced by the underlying revlog."""
    return self._revlog.__iter__()

1747

1748

def rev(self, node):
    """Delegate to the underlying revlog's ``rev(node)``."""
    return self._revlog.rev(node)

1750

1751

def node(self, rev):
    """Delegate to the underlying revlog's ``node(rev)``."""
    return self._revlog.node(rev)

1753

1754

def lookup(self, value):
    """Delegate to the underlying revlog's ``lookup(value)``."""
    return self._revlog.lookup(value)

1756

1757

def parentrevs(self, rev):
    """Delegate to the underlying revlog's ``parentrevs(rev)``."""
    return self._revlog.parentrevs(rev)

1759

1760

def parents(self, node):
    """Delegate to the underlying revlog's ``parents(node)``."""
    return self._revlog.parents(node)

1762

1763

def linkrev(self, rev):
    """Delegate to the underlying revlog's ``linkrev(rev)``."""
    return self._revlog.linkrev(rev)

1765

1766

def checksize(self):
    """Delegate to the underlying revlog's ``checksize()``."""
    return self._revlog.checksize()

1768

1769

def revision(self, node, _df=None, raw=False):
    """Delegate to the underlying revlog's ``revision``.

    ``_df`` and ``raw`` are forwarded unchanged as keyword arguments.
    """
    return self._revlog.revision(node, _df=_df, raw=raw)

1771

1772

def rawdata(self, node, _df=None):
    """Delegate to the underlying revlog's ``rawdata``, forwarding ``_df``."""
    return self._revlog.rawdata(node, _df=_df)

1774

1775

def revdiff(self, rev1, rev2):
    """Delegate to the underlying revlog's ``revdiff(rev1, rev2)``."""
    return self._revlog.revdiff(rev1, rev2)

1777

1778

def cmp(self, node, text):
    """Delegate to the underlying revlog's ``cmp(node, text)``."""
    return self._revlog.cmp(node, text)

1780

1781

def deltaparent(self, rev):
    """Delegate to the underlying revlog's ``deltaparent(rev)``."""
    return self._revlog.deltaparent(rev)

1783

1784

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
):
    """Delegate to the underlying revlog's ``emitrevisions``.

    All arguments are forwarded unchanged; the options are passed by
    keyword.
    """
    return self._revlog.emitrevisions(
        nodes,
        nodesorder=nodesorder,
        revisiondata=revisiondata,
        assumehaveparentrevisions=assumehaveparentrevisions,
        deltamode=deltamode,
    )

1799

1800

def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
    """Delegate to the underlying revlog's ``addgroup``.

    ``addrevisioncb`` is forwarded as a keyword argument.
    """
    return self._revlog.addgroup(
        deltas, linkmapper, transaction, addrevisioncb=addrevisioncb
    )

1804

1805

def rawsize(self, rev):
    """Delegate to the underlying revlog's ``rawsize(rev)``."""
    return self._revlog.rawsize(rev)

1807

1808

def getstrippoint(self, minlink):
    """Delegate to the underlying revlog's ``getstrippoint(minlink)``."""
    return self._revlog.getstrippoint(minlink)

1810

1811

def strip(self, minlink, transaction):
    """Delegate to the underlying revlog's ``strip(minlink, transaction)``."""
    return self._revlog.strip(minlink, transaction)

1813

1814

def files(self):
    """Delegate to the underlying revlog's ``files()``."""
    return self._revlog.files()

1816

1817

def clone(self, tr, destrevlog, **kwargs):
    """Clone the underlying revlog into ``destrevlog``'s underlying revlog.

    Raises ``error.ProgrammingError`` when ``destrevlog`` is not a
    ``manifestrevlog``. Extra keyword arguments are forwarded unchanged.
    """
    if not isinstance(destrevlog, manifestrevlog):
        raise error.ProgrammingError(b'expected manifestrevlog to clone()')

    return self._revlog.clone(tr, destrevlog._revlog, **kwargs)

1822

1823

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Delegate to the underlying revlog's ``storageinfo``.

    Every flag is forwarded unchanged as a keyword argument.
    """
    return self._revlog.storageinfo(
        exclusivefiles=exclusivefiles,
        sharedfiles=sharedfiles,
        revisionscount=revisionscount,
        trackedsize=trackedsize,
        storedsize=storedsize,
    )

1838

1839

@property
def indexfile(self):
    """The ``indexfile`` attribute of the underlying revlog."""
    return self._revlog.indexfile

@indexfile.setter
def indexfile(self, value):
    # Writes go straight through to the wrapped revlog.
    self._revlog.indexfile = value

1846

1847

@property
def opener(self):
    """The ``opener`` attribute of the underlying revlog."""
    return self._revlog.opener

@opener.setter
def opener(self, value):
    # Writes go straight through to the wrapped revlog.
    self._revlog.opener = value

1854

1855

1856

@interfaceutil.implementer(repository.imanifestlog)
class manifestlog(object):
    """A collection class representing the collection of manifest snapshots
    referenced by commits in the repository.

    In this situation, 'manifest' refers to the abstract concept of a snapshot
    of the list of files in the given commit. Consumers of the output of this
    class do not care about the implementation details of the actual manifests
    they receive (i.e. tree or flat or lazily loaded, etc)."""

    def __init__(self, opener, repo, rootstore, narrowmatch):
        # Defaults, overridden below when the opener carries options.
        usetreemanifest = False
        cachesize = 4

        opts = getattr(opener, 'options', None)
        if opts is not None:
            usetreemanifest = opts.get(b'treemanifest', usetreemanifest)
            cachesize = opts.get(b'manifestcachesize', cachesize)

        self._treemanifests = usetreemanifest

        self._rootstore = rootstore
        self._rootstore._setupmanifestcachehooks(repo)
        self._narrowmatch = narrowmatch

        # A cache of the manifestctx or treemanifestctx for each directory
        self._dirmancache = {}
        self._dirmancache[b''] = util.lrucachedict(cachesize)

        self._cachesize = cachesize

    def __getitem__(self, node):
        """Retrieves the manifest instance for the given node. Throws a
        LookupError if not found.
        """
        return self.get(b'', node)

    def get(self, tree, node, verify=True):
        """Retrieves the manifest instance for the given node. Throws a
        LookupError if not found.

        `verify` - if True an exception will be thrown if the node is not in
                   the revlog
        """
        if node in self._dirmancache.get(tree, ()):
            return self._dirmancache[tree][node]

        if not self._narrowmatch.always():
            if not self._narrowmatch.visitdir(tree[:-1]):
                return excludeddirmanifestctx(tree, node)
        if tree:
            if self._rootstore._treeondisk:
                if verify:
                    # Side-effect is LookupError is raised if node doesn't
                    # exist.
                    self.getstorage(tree).rev(node)

                m = treemanifestctx(self, tree, node)
            else:
                raise error.Abort(
                    _(
                        b"cannot ask for manifest directory '%s' in a flat "
                        b"manifest"
                    )
                    % tree
                )
        else:
            if verify:
                # Side-effect is LookupError is raised if node doesn't exist.
                self._rootstore.rev(node)

            if self._treemanifests:
                m = treemanifestctx(self, b'', node)
            else:
                m = manifestctx(self, node)

        # The null node is never cached.
        if node != nullid:
            mancache = self._dirmancache.get(tree)
            if not mancache:
                mancache = util.lrucachedict(self._cachesize)
                self._dirmancache[tree] = mancache
            mancache[node] = m
        return m

    def getstorage(self, tree):
        """Return the root store's directory log for ``tree``."""
        return self._rootstore.dirlog(tree)

    def clearcaches(self, clear_persisted_data=False):
        """Empty the per-directory context cache and the root store caches."""
        self._dirmancache.clear()
        self._rootstore.clearcaches(clear_persisted_data=clear_persisted_data)

    def rev(self, node):
        """Delegate to the root store's ``rev(node)``."""
        return self._rootstore.rev(node)

1949

1950

1951

@interfaceutil.implementer(repository.imanifestrevisionwritable)
class memmanifestctx(object):
    """An in-memory flat manifest that can be written to root storage."""

    def __init__(self, manifestlog):
        self._manifestlog = manifestlog
        # Starts out as an empty manifest.
        self._manifestdict = manifestdict()

    def _storage(self):
        """Return the root (``b''``) storage of the manifest log."""
        return self._manifestlog.getstorage(b'')

    def copy(self):
        """Return a new memmanifestctx holding a copy of this manifest."""
        memmf = memmanifestctx(self._manifestlog)
        memmf._manifestdict = self.read().copy()
        return memmf

    def read(self):
        """Return the in-memory manifest dict itself (not a copy)."""
        return self._manifestdict

    def write(self, transaction, link, p1, p2, added, removed, match=None):
        """Add this manifest to root storage; return the storage's result."""
        return self._storage().add(
            self._manifestdict,
            transaction,
            link,
            p1,
            p2,
            added,
            removed,
            match=match,
        )

1979

1980

1981

@interfaceutil.implementer(repository.imanifestrevisionstored)
class manifestctx(object):
    """A class representing a single revision of a manifest, including its
    contents, its parent revs, and its linkrev.
    """

    def __init__(self, manifestlog, node):
        self._manifestlog = manifestlog
        # Parsed manifest, filled in lazily by read().
        self._data = None

        self._node = node

        # TODO: We eventually want p1, p2, and linkrev exposed on this class,
        # but let's add it later when something needs it and we can load it
        # lazily.
        # self.p1, self.p2 = store.parents(node)
        # rev = store.rev(node)
        # self.linkrev = store.linkrev(rev)

    def _storage(self):
        """Return the root (``b''``) storage of the manifest log."""
        return self._manifestlog.getstorage(b'')

    def node(self):
        """Return the node this context was created for."""
        return self._node

    def copy(self):
        """Return a memmanifestctx holding a copy of this manifest."""
        memmf = memmanifestctx(self._manifestlog)
        memmf._manifestdict = self.read().copy()
        return memmf

    @propertycache
    def parents(self):
        return self._storage().parents(self._node)

    def read(self):
        """Return the manifest dict for this node, loading it on first use."""
        if self._data is None:
            if self._node == nullid:
                self._data = manifestdict()
            else:
                store = self._storage()
                if self._node in store.fulltextcache:
                    text = pycompat.bytestr(store.fulltextcache[self._node])
                else:
                    text = store.revision(self._node)
                    # Remember the full text for later readers.
                    arraytext = bytearray(text)
                    store.fulltextcache[self._node] = arraytext
                self._data = manifestdict(text)
        return self._data

    def readfast(self, shallow=False):
        '''Calls either readdelta or read, based on which would be less work.
        readdelta is called if the delta is against the p1, and therefore can be
        read quickly.

        If `shallow` is True, nothing changes since this is a flat manifest.
        '''
        store = self._storage()
        r = store.rev(self._node)
        deltaparent = store.deltaparent(r)
        if deltaparent != nullrev and deltaparent in store.parentrevs(r):
            return self.readdelta()
        return self.read()

    def readdelta(self, shallow=False):
        '''Returns a manifest containing just the entries that are present
        in this manifest, but not in its p1 manifest. This is efficient to read
        if the revlog delta is already p1.

        Changing the value of `shallow` has no effect on flat manifests.
        '''
        store = self._storage()
        r = store.rev(self._node)
        d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))
        return manifestdict(d)

    def find(self, key):
        """Delegate to ``find(key)`` on the manifest returned by read()."""
        return self.read().find(key)

2058

2059

2060

@interfaceutil.implementer(repository.imanifestrevisionwritable)
class memtreemanifestctx(object):
    """An in-memory tree manifest that can be written to root storage."""

    def __init__(self, manifestlog, dir=b''):
        self._manifestlog = manifestlog
        self._dir = dir
        # Starts out as an empty tree manifest.
        self._treemanifest = treemanifest()

    def _storage(self):
        """Return the root (``b''``) storage of the manifest log."""
        return self._manifestlog.getstorage(b'')

    def copy(self):
        """Return a new memtreemanifestctx with a copy of this manifest."""
        memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
        memmf._treemanifest = self._treemanifest.copy()
        return memmf

    def read(self):
        """Return the in-memory tree manifest itself (not a copy)."""
        return self._treemanifest

    def write(self, transaction, link, p1, p2, added, removed, match=None):
        """Add this manifest to root storage; return the storage's result."""

        def readtree(dir, node):
            # Lets the storage layer load the manifest of any directory.
            return self._manifestlog.get(dir, node).read()

        return self._storage().add(
            self._treemanifest,
            transaction,
            link,
            p1,
            p2,
            added,
            removed,
            readtree=readtree,
            match=match,
        )

2093

2094

2095

@interfaceutil.implementer(repository.imanifestrevisionstored)

2096

@interfaceutil.implementer(repository.imanifestrevisionstored)

2096

class treemanifestctx(object):

2097

class treemanifestctx(object):

2097

def __init__(self, manifestlog, dir, node):
    self._manifestlog = manifestlog
    self._dir = dir
    # Parsed manifest, filled in lazily by read().
    self._data = None

    self._node = node

    # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so that
    # we can instantiate treemanifestctx objects for directories we don't
    # have on disk.
    # self.p1, self.p2 = store.parents(node)
    # rev = store.rev(node)
    # self.linkrev = store.linkrev(rev)

2110

2111

def _storage(self):
    """Return the storage object for this context's directory.

    When a narrow matcher is active and does not visit the directory
    (trailing character of ``self._dir`` dropped before the check), an
    ``excludedmanifestrevlog`` is returned instead of real storage.
    """
    narrowmatch = self._manifestlog._narrowmatch
    if not narrowmatch.always():
        if not narrowmatch.visitdir(self._dir[:-1]):
            return excludedmanifestrevlog(self._dir)
    return self._manifestlog.getstorage(self._dir)

2117

2118

def read(self):
    """Return the tree manifest for this node, loading it on first use.

    The null node yields an empty ``treemanifest``. With tree storage
    on disk the manifest is read through callbacks that fetch this
    revision's text and load subtrees; otherwise the full text is taken
    from (or added to) the store's full-text cache and parsed.
    """
    if self._data is None:
        store = self._storage()
        if self._node == nullid:
            self._data = treemanifest()
        # TODO accessing non-public API
        elif store._treeondisk:
            m = treemanifest(dir=self._dir)

            def gettext():
                return store.revision(self._node)

            def readsubtree(dir, subm):
                # Set verify to False since we need to be able to create
                # subtrees for trees that don't exist on disk.
                return self._manifestlog.get(dir, subm, verify=False).read()

            m.read(gettext, readsubtree)
            m.setnode(self._node)
            self._data = m
        else:
            if self._node in store.fulltextcache:
                text = pycompat.bytestr(store.fulltextcache[self._node])
            else:
                text = store.revision(self._node)
                # Remember the full text for later readers.
                arraytext = bytearray(text)
                store.fulltextcache[self._node] = arraytext
            self._data = treemanifest(dir=self._dir, text=text)

    return self._data

2148

2149

def node(self):
    """Return the node this context was created for."""
    return self._node

2151

2152

def copy(self):
    """Return a memtreemanifestctx holding a copy of this manifest."""
    memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
    memmf._treemanifest = self.read().copy()
    return memmf

2156

2157

@propertycache
def parents(self):
    # Asks this directory's storage for the parents of the node.
    return self._storage().parents(self._node)

2160

2161

def readdelta(self, shallow=False):

2162

def readdelta(self, shallow=False):

2162

'''Returns a manifest containing just the entries that are present

2163

'''Returns a manifest containing just the entries that are present

2163

in this manifest, but not in its p1 manifest. This is efficient to read

2164

in this manifest, but not in its p1 manifest. This is efficient to read

2164

if the revlog delta is already p1.

2165

if the revlog delta is already p1.

2165

2166

If `shallow` is True, this will read the delta for this directory,

2167

If `shallow` is True, this will read the delta for this directory,

2167

without recursively reading subdirectory manifests. Instead, any

2168

without recursively reading subdirectory manifests. Instead, any

2168

subdirectory entry will be reported as it appears in the manifest, i.e.

2169

subdirectory entry will be reported as it appears in the manifest, i.e.

2169

the subdirectory will be reported among files and distinguished only by

2170

the subdirectory will be reported among files and distinguished only by

2170

its 't' flag.

2171

its 't' flag.

2171

'''

2172

'''

2172

store = self._storage()

2173

store = self._storage()

2173

if shallow:

2174

if shallow:

2174

r = store.rev(self._node)

2175

r = store.rev(self._node)

2175

d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))

2176

d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))

2176

return manifestdict(d)

2177

return manifestdict(d)

2177

else:

2178

else:

2178

# Need to perform a slow delta

2179

# Need to perform a slow delta

2179

r0 = store.deltaparent(store.rev(self._node))

2180

r0 = store.deltaparent(store.rev(self._node))

2180

m0 = self._manifestlog.get(self._dir, store.node(r0)).read()

2181

m0 = self._manifestlog.get(self._dir, store.node(r0)).read()

2181

m1 = self.read()

2182

m1 = self.read()

2182

md = treemanifest(dir=self._dir)

2183

md = treemanifest(dir=self._dir)

2183

for f, ((n0, fl0), (n1, fl1)) in pycompat.iteritems(m0.diff(m1)):

2184

for f, ((n0, fl0), (n1, fl1)) in pycompat.iteritems(m0.diff(m1)):

2184

if n1:

2185

if n1:

2185

md[f] = n1

2186

md[f] = n1

2186

if fl1:

2187

if fl1:

2187

md.setflag(f, fl1)

2188

md.setflag(f, fl1)

2188

return md

2189

return md

2189

2190

def readfast(self, shallow=False):

2191

def readfast(self, shallow=False):

2191

'''Calls either readdelta or read, based on which would be less work.

2192

'''Calls either readdelta or read, based on which would be less work.

2192

readdelta is called if the delta is against the p1, and therefore can be

2193

readdelta is called if the delta is against the p1, and therefore can be

2193

read quickly.

2194

read quickly.

2194

2195

If `shallow` is True, it only returns the entries from this manifest,

2196

If `shallow` is True, it only returns the entries from this manifest,

2196

and not any submanifests.

2197

and not any submanifests.

2197

'''

2198

'''

2198

store = self._storage()

2199

store = self._storage()

2199

r = store.rev(self._node)

2200

r = store.rev(self._node)

2200

deltaparent = store.deltaparent(r)

2201

deltaparent = store.deltaparent(r)

2201

if deltaparent != nullrev and deltaparent in store.parentrevs(r):

2202

if deltaparent != nullrev and deltaparent in store.parentrevs(r):

2202

return self.readdelta(shallow=shallow)

2203

return self.readdelta(shallow=shallow)

2203

2204

if shallow:

2205

if shallow:

2205

return manifestdict(store.revision(self._node))

2206

return manifestdict(store.revision(self._node))

2206

else:

2207

else:

2207

return self.read()

2208

return self.read()

2208

2209

def find(self, key):

2210

def find(self, key):

2210

return self.read().find(key)

2211

return self.read().find(key)

2211

2212

2213

class excludeddir(treemanifest):

2214

class excludeddir(treemanifest):

2214

"""Stand-in for a directory that is excluded from the repository.

2215

"""Stand-in for a directory that is excluded from the repository.

2215

2216

With narrowing active on a repository that uses treemanifests,

2217

With narrowing active on a repository that uses treemanifests,

2217

some of the directory revlogs will be excluded from the resulting

2218

some of the directory revlogs will be excluded from the resulting

2218

clone. This is a huge storage win for clients, but means we need

2219

clone. This is a huge storage win for clients, but means we need

2219

some sort of pseudo-manifest to surface to internals so we can

2220

some sort of pseudo-manifest to surface to internals so we can

2220

detect a merge conflict outside the narrowspec. That's what this

2221

detect a merge conflict outside the narrowspec. That's what this

2221

class is: it stands in for a directory whose node is known, but

2222

class is: it stands in for a directory whose node is known, but

2222

whose contents are unknown.

2223

whose contents are unknown.

2223

"""

2224

"""

2224

2225

def __init__(self, dir, node):

2226

def __init__(self, dir, node):

2226

super(excludeddir, self).__init__(dir)

2227

super(excludeddir, self).__init__(dir)

2227

self._node = node

2228

self._node = node

2228

# Add an empty file, which will be included by iterators and such,

2229

# Add an empty file, which will be included by iterators and such,

2229

# appearing as the directory itself (i.e. something like "dir/")

2230

# appearing as the directory itself (i.e. something like "dir/")

2230

self._files[b''] = node

2231

self._files[b''] = node

2231

self._flags[b''] = b't'

2232

self._flags[b''] = b't'

2232

2233

# Manifests outside the narrowspec should never be modified, so avoid

2234

# Manifests outside the narrowspec should never be modified, so avoid

2234

# copying. This makes a noticeable difference when there are very many

2235

# copying. This makes a noticeable difference when there are very many

2235

# directories outside the narrowspec. Also, it makes sense for the copy to

2236

# directories outside the narrowspec. Also, it makes sense for the copy to

2236

# be of the same type as the original, which would not happen with the

2237

# be of the same type as the original, which would not happen with the

2237

# super type's copy().

2238

# super type's copy().

2238

def copy(self):

2239

def copy(self):

2239

return self

2240

return self

2240

2241

2242

class excludeddirmanifestctx(treemanifestctx):

2243

class excludeddirmanifestctx(treemanifestctx):

2243

"""context wrapper for excludeddir - see that docstring for rationale"""

2244

"""context wrapper for excludeddir - see that docstring for rationale"""

2244

2245

def __init__(self, dir, node):

2246

def __init__(self, dir, node):

2246

self._dir = dir

2247

self._dir = dir

2247

self._node = node

2248

self._node = node

2248

2249

def read(self):

2250

def read(self):

2250

return excludeddir(self._dir, self._node)

2251

return excludeddir(self._dir, self._node)

2251

2252

def write(self, *args):

2253

def write(self, *args):

2253

raise error.ProgrammingError(

2254

raise error.ProgrammingError(

2254

b'attempt to write manifest from excluded dir %s' % self._dir

2255

b'attempt to write manifest from excluded dir %s' % self._dir

2255

)

2256

)

2256

2257

2258

class excludedmanifestrevlog(manifestrevlog):

2259

class excludedmanifestrevlog(manifestrevlog):

2259

"""Stand-in for excluded treemanifest revlogs.

2260

"""Stand-in for excluded treemanifest revlogs.

2260

2261

When narrowing is active on a treemanifest repository, we'll have

2262

When narrowing is active on a treemanifest repository, we'll have

2262

references to directories we can't see due to the revlog being

2263

references to directories we can't see due to the revlog being

2263

skipped. This class exists to conform to the manifestrevlog

2264

skipped. This class exists to conform to the manifestrevlog

2264

interface for those directories and proactively prevent writes to

2265

interface for those directories and proactively prevent writes to

2265

outside the narrowspec.

2266

outside the narrowspec.

2266

"""

2267

"""

2267

2268

def __init__(self, dir):

2269

def __init__(self, dir):

2269

self._dir = dir

2270

self._dir = dir

2270

2271

def __len__(self):

2272

def __len__(self):

2272

raise error.ProgrammingError(

2273

raise error.ProgrammingError(

2273

b'attempt to get length of excluded dir %s' % self._dir

2274

b'attempt to get length of excluded dir %s' % self._dir

2274

)

2275

)

2275

2276

def rev(self, node):

2277

def rev(self, node):

2277

raise error.ProgrammingError(

2278

raise error.ProgrammingError(

2278

b'attempt to get rev from excluded dir %s' % self._dir

2279

b'attempt to get rev from excluded dir %s' % self._dir

2279

)

2280

)

2280

2281

def linkrev(self, node):

2282

def linkrev(self, node):

2282

raise error.ProgrammingError(

2283

raise error.ProgrammingError(

2283

b'attempt to get linkrev from excluded dir %s' % self._dir

2284

b'attempt to get linkrev from excluded dir %s' % self._dir

2284

)

2285

)

2285

2286

def node(self, rev):

2287

def node(self, rev):

2287

raise error.ProgrammingError(

2288

raise error.ProgrammingError(

2288

b'attempt to get node from excluded dir %s' % self._dir

2289

b'attempt to get node from excluded dir %s' % self._dir

2289

)

2290

)

2290

2291

def add(self, *args, **kwargs):

2292

def add(self, *args, **kwargs):

2292

# We should never write entries in dirlogs outside the narrow clone.

2293

# We should never write entries in dirlogs outside the narrow clone.

2293

# However, the method still gets called from writesubtree() in

2294

# However, the method still gets called from writesubtree() in

2294

# _addtree(), so we need to handle it. We should possibly make that

2295

# _addtree(), so we need to handle it. We should possibly make that

2295

# avoid calling add() with a clean manifest (_dirty is always False

2296

# avoid calling add() with a clean manifest (_dirty is always False

2296

# in excludeddir instances).

2297

# in excludeddir instances).

2297

pass

2298

pass

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # manifest.py - manifest revision class for mercurial
             #
             # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import heapq
             import itertools
             import struct
             import weakref
             from .i18n import _
             from .node import (
                 bin,
                 hex,
                 nullid,
                 nullrev,
             )
             from .pycompat import getattr
             from . import (
                 encoding,
                 error,
                 match as matchmod,
                 mdiff,
                 pathutil,
                 policy,
                 pycompat,
                 revlog,
                 util,
             )
             from .interfaces import (
                 repository,
                 util as interfaceutil,
             )
             # Module obtained through ``policy.importmod``; later in this file it is
             # probed for a ``lazymanifest`` attribute.
             parsers = policy.importmod('parsers')
             # Short alias so methods below can be decorated with ``@propertycache``.
             propertycache = util.propertycache
             # Allow tests to more easily test the alternate path in manifestdict.fastdelta()
             FASTDELTA_TEXTDIFF_THRESHOLD = 1000
             def _parse(data):
                 # This method does a little bit of excessive-looking
                 # precondition checking. This is so that the behavior of this
                 # class exactly matches its C counterpart to try and help
                 # prevent surprise breakage for anyone that develops against
                 # the pure version.
                 if data and data[-1:] != b'\n':
                     raise ValueError(b'Manifest did not end in a newline.')
                 prev = None
                 for l in data.splitlines():
                     if prev is not None and prev > l:
                         raise ValueError(b'Manifest lines not in sorted order.')
                     prev = l
                     f, n = l.split(b'\0')
                     nl = len(n)
                     if 64 < nl:
                         # modern hash, full width
                         yield f, bin(n[:64]), n[64:]
                     if 40 < nl < 45:
                         # legacy hash, always sha1
                         yield f, bin(n[:40]), n[40:]
                     else:
                         yield f, bin(n), b''
             def _text(it):
                 """Build manifest text from an iterable of ``(file, node, flags)``.

                 Each triple becomes one ``<file>\\0<hex(node)><flags>\\n`` line. After
                 all lines are built, the collected filenames are passed to
                 ``_checkforbidden`` before the joined text is returned.
                 """
                 names = []
                 chunks = []
                 for name, node, flags in it:
                     names.append(name)
                     # if this is changed to support newlines in filenames,
                     # be sure to check the templates/ dir again (especially *-raw.tmpl)
                     line = b"%s\0%s%s\n" % (name, hex(node), flags)
                     chunks.append(line)
                 _checkforbidden(names)
                 return b''.join(chunks)
             class lazymanifestiter(object):
                 """Iterator yielding the filename of each entry of a lazy manifest.

                 ``lm`` must provide ``_get(index)`` returning ``(data, pos)``. A ``pos``
                 of -1 means ``data`` is an entry tuple whose first item is the
                 filename; otherwise ``data`` is the manifest buffer and ``pos`` is the
                 offset where the entry's line starts.
                 """

                 def __init__(self, lm):
                     self.lm = lm
                     self.pos = 0

                 def __iter__(self):
                     return self

                 def next(self):
                     try:
                         source, offset = self.lm._get(self.pos)
                     except IndexError:
                         # ran past the last entry
                         raise StopIteration
                     self.pos += 1
                     if offset == -1:
                         return source[0]
                     # the filename runs from the line start up to the NUL separator
                     nul = source.find(b'\x00', offset)
                     return source[offset:nul]

                 __next__ = next
             class lazymanifestiterentries(object):
                 """Iterator yielding ``(filename, node, flags)`` for each manifest entry.

                 ``lm`` must provide ``_get(index)``, ``extrainfo`` and ``_getflags``.
                 Entries reported by ``_get`` with a position of -1 are returned exactly
                 as stored; the others are decoded from the manifest buffer.
                 """

                 def __init__(self, lm):
                     self.pos = 0
                     self.lm = lm

                 def __iter__(self):
                     return self

                 def next(self):
                     index = self.pos
                     try:
                         data, pos = self.lm._get(index)
                     except IndexError:
                         # ran past the last entry
                         raise StopIteration
                     if pos == -1:
                         self.pos = index + 1
                         return data
                     zeropos = data.find(b'\x00', pos)
                     # 40 hex digits are decoded right after the NUL separator
                     extra = self.lm.extrainfo[index]
                     hashval = unhexlify(data, extra, zeropos + 1, 40)
                     flags = self.lm._getflags(data, index, zeropos)
                     # only advance once the entry has been decoded successfully
                     self.pos = index + 1
                     return (data[pos:zeropos], hashval, flags)

                 __next__ = next
             def unhexlify(data, extra, pos, length):
                 """Decode ``length`` hex digits of ``data`` starting at ``pos``.

                 When ``extra`` is non-zero, its low 8 bits are appended to the decoded
                 value as one additional byte. Returns a byte string.
                 """
                 s = bin(data[pos : pos + length])
                 if extra:
                     # chr() yields text on Python 3 and cannot be appended to bytes;
                     # struct.pack produces a single byte on both Python 2 and 3.
                     s += struct.pack(b'>B', extra & 0xFF)
                 return s
             def _cmp(a, b):
                 return (a > b) - (a < b)
             class _lazymanifest(object):
                 """A pure python manifest backed by a byte string.  It is supplimented with
                 internal lists as it is modified, until it is compacted back to a pure byte
                 string.
                 ``data`` is the initial manifest data.
                 ``positions`` is a list of offsets, one per manifest entry.  Positive
                 values are offsets into ``data``, negative values are offsets into the
                 ``extradata`` list.  When an entry is removed, its entry is dropped from
                 ``positions``.  The values are encoded such that when walking the list and
                 indexing into ``data`` or ``extradata`` as appropriate, the entries are
                 sorted by filename.
                 ``extradata`` is a list of (key, hash, flags) for entries that were added or
                 modified since the manifest was created or compacted.
                 """
                 def __init__(
                     self,
                     data,
                     positions=None,
                     extrainfo=None,
                     extradata=None,
                     hasremovals=False,
                 ):
                     if positions is None:
                         self.positions = self.findlines(data)
                         self.extrainfo = [0] * len(self.positions)
                         self.data = data
                         self.extradata = []
                         self.hasremovals = False
                     else:
                         self.positions = positions[:]
                         self.extrainfo = extrainfo[:]
                         self.extradata = extradata[:]
                         self.data = data
                         self.hasremovals = hasremovals
                 def findlines(self, data):
                     if not data:
                         return []
                     pos = data.find(b"\n")
                     if pos == -1 or data[-1:] != b'\n':
                         raise ValueError(b"Manifest did not end in a newline.")
                     positions = [0]
                     prev = data[: data.find(b'\x00')]
                     while pos < len(data) - 1 and pos != -1:
                         positions.append(pos + 1)
                         nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]
                         if nexts < prev:
                             raise ValueError(b"Manifest lines not in sorted order.")
                         prev = nexts
                         pos = data.find(b"\n", pos + 1)
                     return positions
                 def _get(self, index):
                     # get the position encoded in pos:
                     #   positive number is an index in 'data'
                     #   negative number is in extrapieces
                     pos = self.positions[index]
                     if pos >= 0:
                         return self.data, pos
                     return self.extradata[-pos - 1], -1
                 def _getkey(self, pos):
                     if pos >= 0:
                         return self.data[pos : self.data.find(b'\x00', pos + 1)]
                     return self.extradata[-pos - 1][0]
                 def bsearch(self, key):
                     first = 0
                     last = len(self.positions) - 1
                     while first <= last:
                         midpoint = (first + last) // 2
                         nextpos = self.positions[midpoint]
                         candidate = self._getkey(nextpos)
                         r = _cmp(key, candidate)
                         if r == 0:
                             return midpoint
                         else:
                             if r < 0:
                                 last = midpoint - 1
                             else:
                                 first = midpoint + 1
                     return -1
                 def bsearch2(self, key):
                     # same as the above, but will always return the position
                     # done for performance reasons
                     first = 0
                     last = len(self.positions) - 1
                     while first <= last:
                         midpoint = (first + last) // 2
                         nextpos = self.positions[midpoint]
                         candidate = self._getkey(nextpos)
                         r = _cmp(key, candidate)
                         if r == 0:
                             return (midpoint, True)
                         else:
                             if r < 0:
                                 last = midpoint - 1
                             else:
                                 first = midpoint + 1
                     return (first, False)
                 def __contains__(self, key):
                     return self.bsearch(key) != -1
                 def _getflags(self, data, needle, pos):
                     start = pos + 41
                     end = data.find(b"\n", start)
                     if end == -1:
                         end = len(data) - 1
                     if start == end:
                         return b''
                     return self.data[start:end]
                 def __getitem__(self, key):
                     if not isinstance(key, bytes):
                         raise TypeError(b"getitem: manifest keys must be a bytes.")
                     needle = self.bsearch(key)
                     if needle == -1:
                         raise KeyError
                     data, pos = self._get(needle)
                     if pos == -1:
                         return (data[1], data[2])
                     zeropos = data.find(b'\x00', pos)
                     nlpos = data.find(b'\n', zeropos)
                     assert 0 <= needle <= len(self.positions)
                     assert len(self.extrainfo) == len(self.positions)
                     hlen = nlpos - zeropos - 1
                     # Hashes sometimes have an extra byte tucked on the end, so
                     # detect that.
                     if hlen % 2:
                         hlen -= 1
                     hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)
                     flags = self._getflags(data, needle, zeropos)
                     return (hashval, flags)
                 def __delitem__(self, key):
                     needle, found = self.bsearch2(key)
                     if not found:
                         raise KeyError
                     cur = self.positions[needle]
                     self.positions = self.positions[:needle] + self.positions[needle + 1 :]
                     self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]
                     if cur >= 0:
                         # This does NOT unsort the list as far as the search functions are
                         # concerned, as they only examine lines mapped by self.positions.
                         self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]
                         self.hasremovals = True
                 def __setitem__(self, key, value):
                     if not isinstance(key, bytes):
                         raise TypeError(b"setitem: manifest keys must be a byte string.")
                     if not isinstance(value, tuple) or len(value) != 2:
                         raise TypeError(
                             b"Manifest values must be a tuple of (node, flags)."
                         )
                     hashval = value[0]
                     # hashes are either 20 or 32 bytes (sha1 or its replacement),
                     # and allow one extra byte taht won't be persisted to disk but
                     # is sometimes used in memory.
                     if not isinstance(hashval, bytes) or not (
 <= len(hashval) <= 22 or 32 <= len(hashval) <= 34
                     ):
                         raise TypeError(b"node must be a 20-byte or 32-byte byte string")
                     flags = value[1]
                     if len(hashval) == 22:
                         hashval = hashval[:-1]
                     if not isinstance(flags, bytes) or len(flags) > 1:
                         raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)
                     needle, found = self.bsearch2(key)
                     if found:
                         # put the item
                         pos = self.positions[needle]
                         if pos < 0:
                             self.extradata[-pos - 1] = (key, hashval, value[1])
                         else:
                             # just don't bother
                             self.extradata.append((key, hashval, value[1]))
                             self.positions[needle] = -len(self.extradata)
                     else:
                         # not found, put it in with extra positions
                         self.extradata.append((key, hashval, value[1]))
                         self.positions = (
                             self.positions[:needle]
                             + [-len(self.extradata)]
                             + self.positions[needle:]
                         )
                         self.extrainfo = (
                             self.extrainfo[:needle] + [0] + self.extrainfo[needle:]
                         )
                 def copy(self):
                     # XXX call _compact like in C?
                     return _lazymanifest(
                         self.data,
                         self.positions,
                         self.extrainfo,
                         self.extradata,
                         self.hasremovals,
                     )
                 def _compact(self):
                     # hopefully not called TOO often
                     if len(self.extradata) == 0 and not self.hasremovals:
                         return
                     l = []
                     i = 0
                     offset = 0
                     self.extrainfo = [0] * len(self.positions)
                     while i < len(self.positions):
                         if self.positions[i] >= 0:
                             cur = self.positions[i]
                             last_cut = cur
                             # Collect all contiguous entries in the buffer at the current
                             # offset, breaking out only for added/modified items held in
                             # extradata, or a deleted line prior to the next position.
                             while True:
                                 self.positions[i] = offset
                                 i += 1
                                 if i == len(self.positions) or self.positions[i] < 0:
                                     break
                                 # A removed file has no positions[] entry, but does have an
                                 # overwritten first byte.  Break out and find the end of the
                                 # current good entry/entries if there is a removed file
                                 # before the next position.
                                 if (
                                     self.hasremovals
                                     and self.data.find(b'\n\x00', cur, self.positions[i])
                                     != -1
                                 ):
                                     break
                                 offset += self.positions[i] - cur
                                 cur = self.positions[i]
                             end_cut = self.data.find(b'\n', cur)
                             if end_cut != -1:
                                 end_cut += 1
                             offset += end_cut - cur
                             l.append(self.data[last_cut:end_cut])
                         else:
                             while i < len(self.positions) and self.positions[i] < 0:
                                 cur = self.positions[i]
                                 t = self.extradata[-cur - 1]
                                 l.append(self._pack(t))
                                 self.positions[i] = offset
                                 # Hashes are either 20 bytes (old sha1s) or 32
                                 # bytes (new non-sha1).
                                 hlen = 20
                                 if len(t[1]) > 25:
                                     hlen = 32
                                 if len(t[1]) > hlen:
                                     self.extrainfo[i] = ord(t[1][hlen + 1])
                                 offset += len(l[-1])
                                 i += 1
                     self.data = b''.join(l)
                     self.hasremovals = False
                     self.extradata = []
                 def _pack(self, d):
                     n = d[1]
                     if len(n) == 21 or len(n) == 33:
                         n = n[:-1]
                     assert len(n) == 20 or len(n) == 32
                     return d[0] + b'\x00' + hex(n) + d[2] + b'\n'
                 def text(self):
                     self._compact()
                     return self.data
                 def diff(self, m2, clean=False):
                     '''Finds changes between the current manifest and m2.'''
                     # XXX think whether efficiency matters here
                     diff = {}
                     for fn, e1, flags in self.iterentries():
                         if fn not in m2:
                             diff[fn] = (e1, flags), (None, b'')
                         else:
                             e2 = m2[fn]
                             if (e1, flags) != e2:
                                 diff[fn] = (e1, flags), e2
                             elif clean:
                                 diff[fn] = None
                     for fn, e2, flags in m2.iterentries():
                         if fn not in self:
                             diff[fn] = (None, b''), (e2, flags)
                     return diff
                 def iterentries(self):
                     return lazymanifestiterentries(self)
                 def iterkeys(self):
                     return lazymanifestiter(self)
                 def __iter__(self):
                     return lazymanifestiter(self)
                 def __len__(self):
                     return len(self.positions)
                 def filtercopy(self, filterfn):
                     # XXX should be optimized
                     c = _lazymanifest(b'')
                     for f, n, fl in self.iterentries():
                         if filterfn(f):
                             c[f] = n, fl
                     return c
             # Rebind ``_lazymanifest`` to the ``lazymanifest`` attribute of the
             # ``parsers`` module when it has one; if the attribute is missing, the
             # pure-Python class defined above stays in place.
             try:
                 _lazymanifest = parsers.lazymanifest
             except AttributeError:
                 pass
             @interfaceutil.implementer(repository.imanifestdict)
             class manifestdict(object):
                 def __init__(self, data=b''):
                     """Wrap the manifest text ``data`` in a ``_lazymanifest``."""
                     backing = _lazymanifest(data)
                     self._lm = backing
                 def __getitem__(self, key):
                     return self._lm[key][0]
                 def find(self, key):
                     return self._lm[key]
                 def __len__(self):
                     return len(self._lm)
                 def __nonzero__(self):
                     # nonzero is covered by the __len__ function, but implementing it here
                     # makes it easier for extensions to override.
                     return len(self._lm) != 0
                 __bool__ = __nonzero__
                 def __setitem__(self, key, node):
                     self._lm[key] = node, self.flags(key)
                 def __contains__(self, key):
                     if key is None:
                         return False
                     return key in self._lm
                 def __delitem__(self, key):
                     del self._lm[key]
                 def __iter__(self):
                     return self._lm.__iter__()
                 def iterkeys(self):
                     return self._lm.iterkeys()
                 def keys(self):
                     return list(self.iterkeys())
                 def filesnotin(self, m2, match=None):
                     '''Set of files in this manifest that are not in the other'''
                     if match is not None:
                         match = matchmod.badmatch(match, lambda path, msg: None)
                         sm2 = set(m2.walk(match))
                         return {f for f in self.walk(match) if f not in sm2}
                     return {f for f in self if f not in m2}
                 @propertycache
                 def _dirs(self):
                     return pathutil.dirs(self)
                 def dirs(self):
                     return self._dirs
                 def hasdir(self, dir):
                     return dir in self._dirs
                 def _filesfastpath(self, match):
                     '''Checks whether we can correctly and quickly iterate over matcher
                     files instead of over manifest files.'''
                     files = match.files()
                     return len(files) < 100 and (
                         match.isexact()
                         or (match.prefix() and all(fn in self for fn in files))
                     )
                 def walk(self, match):
                     '''Generates matching file names.
                     Equivalent to manifest.matches(match).iterkeys(), but without creating
                     an entirely new manifest.
                     It also reports nonexistent files by marking them bad with match.bad().
                     '''
                     if match.always():
                         for f in iter(self):
                             yield f
                         return
                     fset = set(match.files())
                     # avoid the entire walk if we're only looking for specific files
                     if self._filesfastpath(match):
                         for fn in sorted(fset):
                             if fn in self:
                                 yield fn
                         return
                     for fn in self:
                         if fn in fset:
                             # specified pattern is the exact name
                             fset.remove(fn)
                         if match(fn):
                             yield fn
                     # for dirstate.walk, files=[''] means "walk the whole tree".
                     # follow that here, too
                     fset.discard(b'')
                     for fn in sorted(fset):
                         if not self.hasdir(fn):
                             match.bad(fn, None)
                 def _matches(self, match):
                     '''generate a new manifest filtered by the match argument'''
                     if match.always():
                         return self.copy()
                     if self._filesfastpath(match):
                         m = manifestdict()
                         lm = self._lm
                         for fn in match.files():
                             if fn in lm:
                                 m._lm[fn] = lm[fn]
                         return m
                     m = manifestdict()
                     m._lm = self._lm.filtercopy(match)
                     return m
                 def diff(self, m2, match=None, clean=False):
                     '''Finds changes between the current manifest and m2.
                     Args:
                       m2: the manifest to which this manifest should be compared.
                       clean: if true, include files unchanged between these manifests
                              with a None value in the returned dictionary.
                     The result is returned as a dict with filename as key and
                     values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
                     nodeid in the current/other manifest and fl1/fl2 is the flag
                     in the current/other manifest. Where the file does not exist,
                     the nodeid will be None and the flags will be the empty
                     string.
                     '''
                     if match:
                         m1 = self._matches(match)
                         m2 = m2._matches(match)
                         return m1.diff(m2, clean=clean)
                     return self._lm.diff(m2._lm, clean)
                 def setflag(self, key, flag):
                     self._lm[key] = self[key], flag
                 def get(self, key, default=None):
                     try:
                         return self._lm[key][0]
                     except KeyError:
                         return default
                 def flags(self, key):
                     try:
                         return self._lm[key][1]
                     except KeyError:
                         return b''
                 def copy(self):
                     c = manifestdict()
                     c._lm = self._lm.copy()
                     return c
                 def items(self):
                     return (x[:2] for x in self._lm.iterentries())
                 def iteritems(self):
                     return (x[:2] for x in self._lm.iterentries())
                 def iterentries(self):
                     return self._lm.iterentries()
                 def text(self):
                     # most likely uses native version
                     return self._lm.text()
                 def fastdelta(self, base, changes):
                     """Given a base manifest text as a bytearray and a list of changes
                     relative to that text, compute a delta that can be used by revlog.
                     """
                     delta = []
                     dstart = None
                     dend = None
                     dline = [b""]
                     start = 0
                     # zero copy representation of base as a buffer
                     addbuf = util.buffer(base)
                     changes = list(changes)
                     if len(changes) < FASTDELTA_TEXTDIFF_THRESHOLD:
                         # start with a readonly loop that finds the offset of
                         # each line and creates the deltas
                         for f, todelete in changes:
                             # bs will either be the index of the item or the insert point
                             start, end = _msearch(addbuf, f, start)
                             if not todelete:
                                 h, fl = self._lm[f]
                                 l = b"%s\0%s%s\n" % (f, hex(h), fl)
                             else:
                                 if start == end:
                                     # item we want to delete was not found, error out
                                     raise AssertionError(
                                         _(b"failed to remove %s from manifest") % f
                                     )
                                 l = b""
                             if dstart is not None and dstart <= start and dend >= start:
                                 if dend < end:
                                     dend = end
                                 if l:
                                     dline.append(l)
                             else:
                                 if dstart is not None:
                                     delta.append([dstart, dend, b"".join(dline)])
                                 dstart = start
                                 dend = end
                                 dline = [l]
                         if dstart is not None:
                             delta.append([dstart, dend, b"".join(dline)])
                         # apply the delta to the base, and get a delta for addrevision
                         deltatext, arraytext = _addlistdelta(base, delta)
                     else:
                         # For large changes, it's much cheaper to just build the text and
                         # diff it.
                         arraytext = bytearray(self.text())
                         deltatext = mdiff.textdiff(
                             util.buffer(base), util.buffer(arraytext)
                         )
                     return arraytext, deltatext
             def _msearch(m, s, lo=0, hi=None):
                 '''return a tuple (start, end) that says where to find s within m.
                 If the string is found m[start:end] are the line containing
                 that string.  If start == end the string was not found and
                 they indicate the proper sorted insertion point.
                 m should be a buffer, a memoryview or a byte string.
                 s is a byte string'''
                 def advance(i, c):
                     while i < lenm and m[i : i + 1] != c:
                         i += 1
                     return i
                 if not s:
                     return (lo, lo)
                 lenm = len(m)
                 if not hi:
                     hi = lenm
                 while lo < hi:
                     mid = (lo + hi) // 2
                     start = mid
                     while start > 0 and m[start - 1 : start] != b'\n':
                         start -= 1
                     end = advance(start, b'\0')
                     if bytes(m[start:end]) < s:
                         # we know that after the null there are 40 bytes of sha1
                         # this translates to the bisect lo = mid + 1
                         lo = advance(end + 40, b'\n') + 1
                     else:
                         # this translates to the bisect hi = mid
                         hi = start
                 end = advance(lo, b'\0')
                 found = m[lo:end]
                 if s == found:
                     # we know that after the null there are 40 bytes of sha1
                     end = advance(end + 40, b'\n')
                     return (lo, end + 1)
                 else:
                     return (lo, lo)
             def _checkforbidden(l):
                 """Check filenames for illegal characters."""
                 for f in l:
                     if b'\n' in f or b'\r' in f:
                         raise error.StorageError(
                             _(b"'\\n' and '\\r' disallowed in filenames: %r")
                             % pycompat.bytestr(f)
                         )
             # apply the changes collected during the bisect loop to our addlist
             # return a delta suitable for addrevision
             def _addlistdelta(addlist, x):
                 # for large addlist arrays, building a new array is cheaper
                 # than repeatedly modifying the existing one
                 currentposition = 0
                 newaddlist = bytearray()
                 for start, end, content in x:
                     newaddlist += addlist[currentposition:start]
                     if content:
                         newaddlist += bytearray(content)
                     currentposition = end
                 newaddlist += addlist[currentposition:]
                 deltatext = b"".join(
                     struct.pack(b">lll", start, end, len(content)) + content
                     for start, end, content in x
                 )
                 return deltatext, newaddlist
             def _splittopdir(f):
                 if b'/' in f:
                     dir, subpath = f.split(b'/', 1)
                     return dir + b'/', subpath
                 else:
                     return b'', f
             _noop = lambda s: None
             @interfaceutil.implementer(repository.imanifestdict)
             class treemanifest(object):
                 def __init__(self, dir=b'', text=b''):
                     """Create a tree manifest for directory ``dir``.
                     When ``text`` is non-empty it is parsed right away and the
                     instance is marked dirty; the parse callback for subtrees
                     always raises, so only flat manifest text is accepted."""
                     self._dir = dir
                     self._node = nullid
                     self._dirty = False
                     self._loadfunc = _noop
                     self._copyfunc = _noop
                     self._dirs = {}
                     self._lazydirs = {}
                     # Using _lazymanifest here is a little slower than plain old dicts
                     self._files = {}
                     self._flags = {}
                     if not text:
                         return
                     def rejectsubtree(subdir, subm):
                         raise AssertionError(
                             b'treemanifest constructor only accepts flat manifests'
                         )
                     self.parse(text, rejectsubtree)
                     # Mark flat manifest dirty after parsing
                     self._dirty = True
                 def _subpath(self, path):
                     return self._dir + path
                 def _loadalllazy(self):
                     """Read every entry of ``_lazydirs`` into ``_dirs`` (copying
                     the subtree when its ``docopy`` field is true), then reset
                     ``_lazydirs`` to an empty dict."""
                     loaded = self._dirs
                     for d, entry in pycompat.iteritems(self._lazydirs):
                         path, node, readsubtree, docopy = entry
                         subtree = readsubtree(path, node)
                         loaded[d] = subtree.copy() if docopy else subtree
                     self._lazydirs = {}
                 def _loadlazy(self, d):
                     v = self._lazydirs.get(d)
                     if v:
                         path, node, readsubtree, docopy = v
                         if docopy:
                             self._dirs[d] = readsubtree(path, node).copy()
                         else:
                             self._dirs[d] = readsubtree(path, node)
                         del self._lazydirs[d]
                 def _loadchildrensetlazy(self, visit):
                     if not visit:
                         return None
                     if visit == b'all' or visit == b'this':
                         self._loadalllazy()
                         return None
                     loadlazy = self._loadlazy
                     for k in visit:
                         loadlazy(k + b'/')
                     return visit
                 def _loaddifflazy(self, t1, t2):
                     """Load the lazy directories of t1 and t2 that a diff needs.
                     A directory is loaded in both trees when:
                     - it is lazy in only one of them (in the other it may already be
                       loaded or may not exist, which does not matter), or
                     - it is lazy in both but the recorded nodeids differ.
                     """
                     lazy1 = t1._lazydirs
                     lazy2 = t2._lazydirs
                     pending = []
                     for d, v1 in pycompat.iteritems(lazy1):
                         v2 = lazy2.get(d)
                         if v2 and v2[1] == v1[1]:
                             # lazy on both sides with the same node: skip
                             continue
                         pending.append(d)
                     pending.extend(
                         d for d, v2 in pycompat.iteritems(lazy2) if d not in lazy1
                     )
                     for d in pending:
                         t1._loadlazy(d)
                         t2._loadlazy(d)
                 def __len__(self):
                     """Return the number of files here plus the lengths of all
                     sub-manifests; every lazy directory gets loaded."""
                     self._load()
                     ownfiles = len(self._files)
                     self._loadalllazy()
                     return ownfiles + sum(m.__len__() for m in self._dirs.values())
                 def __nonzero__(self):
                     # Cheaper than comparing the length with 0 because it avoids
                     # loading sub-manifests
                     empty = self._isempty()
                     return not empty
                 __bool__ = __nonzero__
                 def _isempty(self):
                     """Return True when neither this manifest nor any of its
                     sub-manifests holds a file."""
                     self._load()  # for consistency; already loaded by all callers
                     # First look only at what is already loaded, so that lazy
                     # directories may not need loading at all.
                     if self._files:
                         return False
                     if self._dirs:
                         for m in self._dirs.values():
                             if not m._isempty():
                                 return False
                     self._loadalllazy()
                     for m in self._dirs.values():
                         if not m._isempty():
                             return False
                     return True
                 @encoding.strmethod
                 def __repr__(self):
                     """Describe the instance: directory, hex node, whether the load
                     function is the no-op, dirty flag and object id."""
                     template = (
                         b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
                     )
                     isloaded = bool(self._loadfunc is _noop)
                     fields = (
                         self._dir,
                         hex(self._node),
                         isloaded,
                         self._dirty,
                         id(self),
                     )
                     return template % fields
                 def dir(self):
                     '''The directory that this tree manifest represents, including a
                     trailing '/'. Empty string for the repo root directory.'''
                     return self._dir
                 def node(self):
                     '''This node of this instance. nullid for unsaved instances. Should
                     be updated when the instance is read or written from a revlog.
                     '''
                     assert not self._dirty
                     return self._node
                 def setnode(self, node):
                     self._node = node
                     self._dirty = False
                 def iterentries(self):
                     """Yield ``(fullpath, node, flags)`` for every file, visiting the
                     names of this directory in sorted order and descending into
                     sub-manifests."""
                     self._load()
                     self._loadalllazy()
                     merged = list(self._dirs.items())
                     merged.extend(self._files.items())
                     merged.sort()
                     for name, value in merged:
                         if name in self._files:
                             yield self._subpath(name), value, self._flags.get(name, b'')
                             continue
                         # a sub-manifest: forward its own entries
                         for entry in value.iterentries():
                             yield entry
                 def items(self):
                     """Yield ``(fullpath, node)`` for every file, visiting the names
                     of this directory in sorted order and descending into
                     sub-manifests."""
                     self._load()
                     self._loadalllazy()
                     merged = sorted(
                         itertools.chain(self._dirs.items(), self._files.items())
                     )
                     for name, value in merged:
                         if name not in self._files:
                             # a sub-manifest: forward its own pairs
                             for path, node in pycompat.iteritems(value):
                                 yield path, node
                             continue
                         yield self._subpath(name), value
                 iteritems = items
                 def iterkeys(self):
                     """Yield the full path of every file, visiting the names of this
                     directory in sorted order and descending into sub-manifests."""
                     self._load()
                     self._loadalllazy()
                     names = list(self._dirs) + list(self._files)
                     names.sort()
                     for name in names:
                         if name not in self._files:
                             for path in self._dirs[name]:
                                 yield path
                             continue
                         yield self._subpath(name)
                 def keys(self):
                     """Return the result of ``iterkeys()`` as a list."""
                     names = self.iterkeys()
                     return list(names)
                 def __iter__(self):
                     """Iterating the manifest is the same as calling ``iterkeys()``."""
                     keyiter = self.iterkeys()
                     return keyiter
                 def __contains__(self, f):
                     """Tell whether file ``f`` is in this manifest; ``None`` never
                     is. Paths with a directory part are delegated to the matching
                     sub-manifest."""
                     if f is None:
                         return False
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if not topdir:
                         return f in self._files
                     self._loadlazy(topdir)
                     if topdir in self._dirs:
                         return self._dirs[topdir].__contains__(subpath)
                     return False
                 def get(self, f, default=None):
                     """Return the node stored for ``f``, or ``default`` when the
                     file (or its top-level directory) is not present."""
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if not topdir:
                         return self._files.get(f, default)
                     self._loadlazy(topdir)
                     if topdir in self._dirs:
                         return self._dirs[topdir].get(subpath, default)
                     return default
                 def __getitem__(self, f):
                     """Return the node stored for ``f``; lookups of missing names
                     raise from the underlying dict access."""
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if not topdir:
                         return self._files[f]
                     self._loadlazy(topdir)
                     return self._dirs[topdir].__getitem__(subpath)
                 def flags(self, f):
                     """Return the flags of ``f``, or ``b''`` when it has none, is
                     unknown, or names a directory of this manifest."""
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if not topdir:
                         if f in self._lazydirs or f in self._dirs:
                             return b''
                         return self._flags.get(f, b'')
                     self._loadlazy(topdir)
                     if topdir in self._dirs:
                         return self._dirs[topdir].flags(subpath)
                     return b''
                 def find(self, f):
                     """Return ``(node, flags)`` for ``f``; flags default to ``b''``."""
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if not topdir:
                         return self._files[f], self._flags.get(f, b'')
                     self._loadlazy(topdir)
                     return self._dirs[topdir].find(subpath)
                 def __delitem__(self, f):
                     """Remove file ``f`` (and its flag) and mark the manifest dirty.
                     A sub-manifest left empty by the removal is dropped too."""
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if topdir:
                         self._loadlazy(topdir)
                         subtree = self._dirs[topdir]
                         subtree.__delitem__(subpath)
                         # If the directory is now empty, remove it
                         if subtree._isempty():
                             del self._dirs[topdir]
                     else:
                         del self._files[f]
                         self._flags.pop(f, None)
                     self._dirty = True
                 def __setitem__(self, f, n):
                     """Store node ``n`` for file ``f``, creating the sub-manifest for
                     its top-level directory when needed, and mark the manifest
                     dirty. ``n`` must not be None."""
                     assert n is not None
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if topdir:
                         self._loadlazy(topdir)
                         if topdir not in self._dirs:
                             self._dirs[topdir] = treemanifest(self._subpath(topdir))
                         self._dirs[topdir].__setitem__(subpath, n)
                     else:
                         # manifest nodes are either 20 bytes or 32 bytes,
                         # depending on the hash in use. An extra byte is
                         # occasionally used by hg, but won't ever be
                         # persisted. Trim to 21 or 33 bytes as appropriate.
                         if len(n) < 25:
                             trim = 21
                         else:
                             trim = 33
                         # to match manifestdict's behavior
                         self._files[f] = n[:trim]
                     self._dirty = True
                 def _load(self):
                     """Run the pending load function if there is one, otherwise the
                     pending copy function; each is reset to ``_noop`` before it is
                     called."""
                     loader = self._loadfunc
                     if loader is not _noop:
                         self._loadfunc = _noop
                         loader(self)
                         return
                     copier = self._copyfunc
                     if copier is not _noop:
                         self._copyfunc = _noop
                         copier(self)
                 def setflag(self, f, flags):
                     """Set the flags (symlink, executable) for path f and mark the
                     manifest dirty."""
                     self._load()
                     topdir, subpath = _splittopdir(f)
                     if not topdir:
                         self._flags[f] = flags
                     else:
                         self._loadlazy(topdir)
                         if topdir not in self._dirs:
                             self._dirs[topdir] = treemanifest(self._subpath(topdir))
                         self._dirs[topdir].setflag(subpath, flags)
                     self._dirty = True
                 def copy(self):
                     """Return a copy of this manifest.
                     If this instance still has a pending copy function, the copy
                     shares it. Otherwise the contents are copied immediately when
                     this instance has no pending load function, or deferred through
                     the copy's ``_copyfunc`` when it has one."""
                     dup = treemanifest(self._dir)
                     dup._node = self._node
                     dup._dirty = self._dirty
                     if self._copyfunc is not _noop:
                         dup._copyfunc = self._copyfunc
                         return dup
                     def _copyfunc(s):
                         self._load()
                         # lazy entries are shared, flagged so they get copied on load
                         s._lazydirs = {
                             d: (p, n, r, True)
                             for d, (p, n, r, c) in pycompat.iteritems(self._lazydirs)
                         }
                         targetdirs = s._dirs
                         for d, subtree in pycompat.iteritems(self._dirs):
                             targetdirs[d] = subtree.copy()
                         s._files = dict.copy(self._files)
                         s._flags = dict.copy(self._flags)
                     if self._loadfunc is _noop:
                         _copyfunc(dup)
                     else:
                         dup._copyfunc = _copyfunc
                     return dup
                 def filesnotin(self, m2, match=None):
                     '''Return the set of files present here but absent from ``m2``.
                     With a matcher that does not match everything, both manifests
                     are filtered first.'''
                     if match and not match.always():
                         m1 = self._matches(match)
                         m2 = m2._matches(match)
                         return m1.filesnotin(m2)
                     missing = set()
                     def _collect(left, right):
                         unchanged = (
                             left._node == right._node
                             and not left._dirty
                             and not right._dirty
                         )
                         if unchanged:
                             return
                         left._load()
                         right._load()
                         self._loaddifflazy(left, right)
                         for d, leftsub in pycompat.iteritems(left._dirs):
                             if d not in right._dirs:
                                 # whole directory is missing on the other side
                                 missing.update(leftsub.iterkeys())
                                 continue
                             _collect(leftsub, right._dirs[d])
                         missing.update(
                             left._subpath(fn)
                             for fn in left._files
                             if fn not in right._files
                         )
                     _collect(self, m2)
                     return missing
                 @propertycache
                 def _alldirs(self):
                     # built from this manifest by pathutil.dirs
                     alldirs = pathutil.dirs(self)
                     return alldirs
                 def dirs(self):
                     """Return the ``_alldirs`` object of this manifest."""
                     alldirs = self._alldirs
                     return alldirs
                 def hasdir(self, dir):
                     """Tell whether ``dir`` (no trailing slash) is a directory of this
                     manifest, loaded or lazy; nested paths are delegated to the
                     matching sub-manifest."""
                     self._load()
                     topdir, subdir = _splittopdir(dir)
                     if topdir:
                         self._loadlazy(topdir)
                         if topdir not in self._dirs:
                             return False
                         return self._dirs[topdir].hasdir(subdir)
                     dirslash = dir + b'/'
                     if dirslash in self._dirs:
                         return True
                     return dirslash in self._lazydirs
                 def walk(self, match):
                     '''Yield the names of the files selected by ``match``.
                     Files named by the matcher that are neither produced by the walk
                     nor known as directories are reported through match.bad().
                     '''
                     if match.always():
                         for name in iter(self):
                             yield name
                         return
                     pending = set(match.files())
                     for name in self._walk(match):
                         # a pattern that is the exact name has been satisfied
                         pending.discard(name)
                         yield name
                     # for dirstate.walk, files=[''] means "walk the whole tree".
                     # follow that here, too
                     pending.discard(b'')
                     for name in sorted(pending):
                         if self.hasdir(name):
                             continue
                         match.bad(name, None)
                 def _walk(self, match):
                     '''Recursive helper of walk(): yield matching file names found in
                     this directory and in the sub-manifests the matcher asks to
                     visit.'''
                     visit = match.visitchildrenset(self._dir[:-1])
                     if not visit:
                         return
                     # yield this dir's files and walk its submanifests
                     self._load()
                     visit = self._loadchildrensetlazy(visit)
                     names = list(self._dirs) + list(self._files)
                     names.sort()
                     for name in names:
                         if name in self._files:
                             fullpath = self._subpath(name)
                             if match(fullpath):
                                 yield fullpath
                             continue
                         if visit and name[:-1] not in visit:
                             continue
                         for path in self._dirs[name]._walk(match):
                             yield path
                 def _matches(self, match):
                     '''Return a new manifest, built recursively, restricted to what
                     ``match`` selects; a matcher that matches everything yields a
                     plain copy.'''
                     if not match.always():
                         return self._matches_inner(match)
                     return self.copy()
                 def _matches_inner(self, match):
                     """Recursive worker of ``_matches``: build the filtered manifest
                     for this directory. The result is marked dirty when it is not
                     empty."""
                     if match.always():
                         return self.copy()
                     visit = match.visitchildrenset(self._dir[:-1])
                     if visit == b'all':
                         return self.copy()
                     ret = treemanifest(self._dir)
                     if not visit:
                         return ret
                     self._load()
                     thisdir = visit == b'this'
                     for fn in self._files:
                         # While visitchildrenset *usually* lists only subdirs, this
                         # is actually up to the matcher and may have some files in
                         # the set(). With 'this' every file of the directory is
                         # examined; with a set only the names it contains are.
                         if not (thisdir or fn in visit):
                             continue
                         # visitchildrenset isn't perfect, we still need to call the
                         # regular matcher code to further filter results.
                         if match(self._subpath(fn)):
                             ret._files[fn] = self._files[fn]
                             if fn in self._flags:
                                 ret._flags[fn] = self._flags[fn]
                     visit = self._loadchildrensetlazy(visit)
                     for dir, subm in pycompat.iteritems(self._dirs):
                         if visit and dir[:-1] not in visit:
                             continue
                         filtered = subm._matches_inner(match)
                         if not filtered._isempty():
                             ret._dirs[dir] = filtered
                     if not ret._isempty():
                         ret._dirty = True
                     return ret
                 def fastdelta(self, base, changes):
                     """Always raise FastdeltaUnavailable; both arguments are
                     ignored."""
                     raise FastdeltaUnavailable()
                 def diff(self, m2, match=None, clean=False):
                     '''Compute the differences between this manifest and ``m2``.
                     Args:
                       m2: the manifest this one is compared against.
                       clean: if true, files identical in both manifests are also
                              reported, with a None value.
                     Returns a dict keyed by filename whose values look like
                     ((n1,fl1),(n2,fl2)): n1/fl1 are the nodeid and flag in this
                     manifest, n2/fl2 those in ``m2``. A file missing on one side
                     has a None nodeid and an empty flag string there.
                     '''
                     if match and not match.always():
                         m1 = self._matches(match)
                         m2 = m2._matches(match)
                         return m1.diff(m2, clean=clean)
                     result = {}
                     emptytree = treemanifest()
                     def _compare(left, right, todo):
                         """Diff the files of two trees into ``result`` and queue
                         the pairs of sub-trees still to compare on ``todo``."""
                         unchanged = (
                             left._node == right._node
                             and not left._dirty
                             and not right._dirty
                         )
                         if unchanged:
                             return
                         left._load()
                         right._load()
                         self._loaddifflazy(left, right)
                         for d, leftsub in pycompat.iteritems(left._dirs):
                             todo.append((leftsub, right._dirs.get(d, emptytree)))
                         for d, rightsub in pycompat.iteritems(right._dirs):
                             if d not in left._dirs:
                                 todo.append((emptytree, rightsub))
                         for fn, n1 in pycompat.iteritems(left._files):
                             fl1 = left._flags.get(fn, b'')
                             n2 = right._files.get(fn, None)
                             fl2 = right._flags.get(fn, b'')
                             if n1 != n2 or fl1 != fl2:
                                 result[left._subpath(fn)] = ((n1, fl1), (n2, fl2))
                             elif clean:
                                 result[left._subpath(fn)] = None
                         for fn, n2 in pycompat.iteritems(right._files):
                             if fn in left._files:
                                 continue
                             fl2 = right._flags.get(fn, b'')
                             result[right._subpath(fn)] = ((None, b''), (n2, fl2))
                     # explicit stack instead of recursion; _compare refills it
                     todo = [(self, m2)]
                     while todo:
                         left, right = todo.pop()
                         _compare(left, right, todo)
                     return result
                 def unmodifiedsince(self, m2):
                     """Report whether this manifest and m2 are both clean and share
                     the same node.

                     Returns False as soon as either side is flagged dirty; otherwise
                     the result is the comparison of the two ``_node`` values.
                     """
                     if self._dirty or m2._dirty:
                         return False
                     return self._node == m2._node
                 def parse(self, text, readsubtree):
                     """Fill this manifest from the serialized `text`.

                     Entries flagged b't' are recorded as lazy subdirectories that
                     carry `readsubtree` for later loading. Entries whose name
                     contains a slash go through item assignment and setflag(); all
                     other entries are stored straight into _files and _flags.
                     """
                     lazydirs = self._lazydirs
                     fullpath = self._subpath
                     for name, node, flag in _parse(text):
                         if flag == b't':
                             dirname = name + b'/'
                             # False below means "doesn't need to be copied" and can
                             # use the cached value from readsubtree directly.
                             lazydirs[dirname] = (
                                 fullpath(dirname),
                                 node,
                                 readsubtree,
                                 False,
                             )
                             continue

                         if b'/' not in name:
                             # Assigning to _files and _flags avoids marking as dirty,
                             # and should be a little faster.
                             self._files[name] = node
                             if flag:
                                 self._flags[name] = flag
                             continue

                         # This is a flat manifest, so use __setitem__ and setflag
                         # rather than assigning directly to _files and _flags, so we
                         # can assign a path in a subdirectory, and to mark dirty
                         # (compared to nullid).
                         self[name] = node
                         if flag:
                             self.setflag(name, flag)
                 def text(self):
                     """Return the complete contents of this manifest as a bytestring."""
                     self._load()
                     entries = self.iterentries()
                     return _text(entries)
                 def dirtext(self):
                     """Serialize just this directory level as a bytestring.

                     Subdirectories are emitted as entries flagged b't' that carry the
                     subtree's node, so any submanifests must have been written first
                     for those nodeids to be correct.
                     """
                     self._load()
                     getflag = self.flags

                     lazyentries = []
                     for dirname, lazyinfo in pycompat.iteritems(self._lazydirs):
                         # lazyinfo[1] is the node stored for the unloaded subtree;
                         # the trailing slash is dropped from the directory name.
                         lazyentries.append((dirname[:-1], lazyinfo[1], b't'))

                     direntries = []
                     for dirname in self._dirs:
                         direntries.append(
                             (dirname[:-1], self._dirs[dirname]._node, b't')
                         )

                     fileentries = []
                     for fname in self._files:
                         fileentries.append(
                             (fname, self._files[fname], getflag(fname))
                         )

                     entries = direntries + fileentries + lazyentries
                     entries.sort()
                     return _text(entries)
                 def read(self, gettext, readsubtree):
                     """Arrange for this manifest to be populated lazily.

                     Nothing is parsed here; a loader is stored in ``_loadfunc``. When
                     that loader is invoked with a manifest, it parses ``gettext()``
                     using ``readsubtree`` and then clears the manifest's dirty flag.
                     """

                     def _load_for_read(tree):
                         data = gettext()
                         tree.parse(data, readsubtree)
                         tree._dirty = False

                     self._loadfunc = _load_for_read
                 def writesubtrees(self, m1, m2, writesubtree, match):
                     """Call `writesubtree` for each loaded subdirectory that `match`
                     does not rule out.

                     For every such subdirectory the callback receives the subtree,
                     the corresponding node from `m1`, the one from `m2`, and
                     `match`. When the `m1` node is nullid the two parent nodes are
                     swapped before the call.
                     """
                     self._load()  # for consistency; should never have any effect here
                     m1._load()
                     m2._load()
                     notree = treemanifest()

                     def parentnode(parent, dirname):
                         """Node of `dirname` in `parent`, preferring its lazy entry."""
                         lazyentry = parent._lazydirs.get(dirname)
                         if lazyentry:
                             return lazyentry[1]
                         return parent._dirs.get(dirname, notree)._node

                     # let's skip investigating things that `match` says we do not need.
                     wanted = self._loadchildrensetlazy(
                         match.visitchildrenset(self._dir[:-1])
                     )
                     if wanted == b'all' or wanted == b'this':
                         # No per-directory restriction applies below.
                         wanted = None

                     for dirname, subtree in pycompat.iteritems(self._dirs):
                         if wanted and dirname[:-1] not in wanted:
                             continue
                         node1 = parentnode(m1, dirname)
                         node2 = parentnode(m2, dirname)
                         if node1 == nullid:
                             node1, node2 = node2, node1
                         writesubtree(subtree, node1, node2, match)
                 def walksubtrees(self, matcher=None):
                     """Yield this manifest and then, recursively, its subtrees.

                     With a `matcher`, a tree whose directory the matcher refuses to
                     visit is pruned together with everything below it, and a tree is
                     only yielded when the matcher accepts its directory.
                     """
                     if matcher:
                         if not matcher.visitdir(self._dir[:-1]):
                             return
                         if matcher(self._dir[:-1]):
                             yield self
                     else:
                         yield self

                     self._load()
                     # OPT: use visitchildrenset to avoid loading everything.
                     self._loadalllazy()
                     for _dirname, subtree in pycompat.iteritems(self._dirs):
                         for found in subtree.walksubtrees(matcher=matcher):
                             yield found
             class manifestfulltextcache(util.lrucachedict):
                 """File-backed LRU cache for the manifest cache

                 File consists of entries, up to EOF:

                 - 20 bytes node, 4 bytes length, <length> manifest data

                 These are written in reverse cache order (oldest to newest).

                 The file is only touched once an opener has been assigned to
                 ``_opener``; it is then read lazily the first time the cache is
                 consulted.
                 """

                 _file = b'manifestfulltextcache'

                 def __init__(self, max):
                     super(manifestfulltextcache, self).__init__(max)
                     # True when the in-memory state differs from what is on disk.
                     self._dirty = False
                     # True once the backing file has been loaded (or found missing).
                     self._read = False
                     # Callable used to open the backing file; None disables persistence.
                     self._opener = None

                 def read(self):
                     """Populate the cache from the backing file, if not done already.

                     Does nothing when the file was already read or no opener is set.
                     A missing file (IOError) is tolerated, and a truncated entry ends
                     the load without raising.
                     """
                     if self._read or self._opener is None:
                         return

                     try:
                         with self._opener(self._file) as fp:
                             # Use the parent class setter: our own __setitem__ would
                             # call read() again and mark the cache dirty.
                             setitem = super(manifestfulltextcache, self).__setitem__
                             # ignore trailing data, this is a cache, corruption is skipped
                             while True:
                                 # TODO do we need to do work here for sha1 portability?
                                 node = fp.read(20)
                                 if len(node) < 20:
                                     break
                                 try:
                                     size = struct.unpack(b'>L', fp.read(4))[0]
                                 except struct.error:
                                     break
                                 value = bytearray(fp.read(size))
                                 if len(value) != size:
                                     break
                                 setitem(node, value)
                     except IOError:
                         # the file is allowed to be missing
                         pass

                     self._read = True
                     self._dirty = False

                 def write(self):
                     """Write the cache to the backing file if it is dirty and an
                     opener is set; otherwise do nothing."""
                     if not self._dirty or self._opener is None:
                         return
                     # rotate backwards to the first used node
                     with self._opener(
                         self._file, b'w', atomictemp=True, checkambig=True
                     ) as fp:
                         node = self._head.prev
                         while True:
                             # Only nodes whose key is still in the cache are written.
                             if node.key in self._cache:
                                 fp.write(node.key)
                                 fp.write(struct.pack(b'>L', len(node.value)))
                                 fp.write(node.value)
                             if node is self._head:
                                 break
                             node = node.prev

                 def __len__(self):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).__len__()

                 def __contains__(self, k):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).__contains__(k)

                 def __iter__(self):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).__iter__()

                 def __getitem__(self, k):
                     if not self._read:
                         self.read()
                     # the cache lru order can change on read
                     setdirty = self._cache.get(k) is not self._head
                     value = super(manifestfulltextcache, self).__getitem__(k)
                     if setdirty:
                         self._dirty = True
                     return value

                 def __setitem__(self, k, v):
                     if not self._read:
                         self.read()
                     super(manifestfulltextcache, self).__setitem__(k, v)
                     self._dirty = True

                 def __delitem__(self, k):
                     if not self._read:
                         self.read()
                     super(manifestfulltextcache, self).__delitem__(k)
                     self._dirty = True

                 def get(self, k, default=None):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).get(k, default=default)

                 def clear(self, clear_persisted_data=False):
                     """Empty the in-memory cache.

                     With `clear_persisted_data` the (now empty) cache is also written
                     out. In both cases the next access re-reads the backing file.
                     """
                     super(manifestfulltextcache, self).clear()
                     if clear_persisted_data:
                         self._dirty = True
                         self.write()
                     self._read = False
             # an upper bound of what we expect from compression
             # (real live value seems to be "3")
             MAXCOMPRESSION = 3
             class FastdeltaUnavailable(Exception):
                 """Exception raised when fastdelta isn't usable on a manifest.

                 manifestrevlog.add() raises it when the first parent is not in the
                 fulltext cache, and catches it to fall back to writing without a
                 precomputed delta.
                 """
             @interfaceutil.implementer(repository.imanifeststorage)
             class manifestrevlog(object):
                 '''A revlog that stores manifest texts. This is responsible for caching the
                 full-text manifest contents.

                 The actual storage is a revlog.revlog instance kept in ``_revlog``;
                 most methods of this class forward to it.
                 '''
                 def __init__(
                     self,
                     opener,
                     tree=b'',
                     dirlogcache=None,
                     indexfile=None,
                     treemanifest=False,
                 ):
                     """Constructs a new manifest revlog

                     `tree` - directory this revlog stores; b'' is the root manifest.

                     `dirlogcache` - cache of per-directory revlogs, used as-is for a
                     non-root `tree`. A root revlog creates its own.

                     `indexfile` - used by extensions to have two manifests at once, like
                     when transitioning between flat manifests and treemanifests.

                     `treemanifest` - used to indicate this is a tree manifest revlog. Opener
                     options can also be used to make this a tree manifest revlog. The opener
                     option takes precedence, so if it is set to True, we ignore whatever
                     value is passed in to the constructor.
                     """
                     # During normal operations, we expect to deal with not more than four
                     # revs at a time (such as during commit --amend). When rebasing large
                     # stacks of commits, the number can go up, hence the config knob below.
                     cachesize = 4
                     optiontreemanifest = False
                     opts = getattr(opener, 'options', None)
                     if opts is not None:
                         cachesize = opts.get(b'manifestcachesize', cachesize)
                         optiontreemanifest = opts.get(b'treemanifest', False)
                     self._treeondisk = optiontreemanifest or treemanifest
                     self._fulltextcache = manifestfulltextcache(cachesize)
                     # A non-root tree only makes sense for tree manifests.
                     if tree:
                         assert self._treeondisk, b'opts is %r' % opts
                     if indexfile is None:
                         indexfile = b'00manifest.i'
                         if tree:
                             indexfile = b"meta/" + tree + indexfile
                     self.tree = tree
                     # The dirlogcache is kept on the root manifest log
                     if tree:
                         self._dirlogcache = dirlogcache
                     else:
                         self._dirlogcache = {b'': self}
                     self._revlog = revlog.revlog(
                         opener,
                         indexfile,
                         # only root indexfile is cached
                         checkambig=not bool(tree),
                         mmaplargeindex=True,
                         upperboundcomp=MAXCOMPRESSION,
                     )
                     # Expose a few attributes of the wrapped revlog directly.
                     self.index = self._revlog.index
                     self.version = self._revlog.version
                     self._generaldelta = self._revlog._generaldelta
                 def _setupmanifestcachehooks(self, repo):
                     """Persist the manifestfulltextcache on lock release"""
                     # Repos without a _wlockref attribute get no persistence at all.
                     if not util.safehasattr(repo, b'_wlockref'):
                         return
                     # Giving the cache an opener is what allows it to read and write
                     # its backing file.
                     self._fulltextcache._opener = repo.wcachevfs
                     # _currentlock() reported no lock for _wlockref, so there is no
                     # release to attach the write to.
                     if repo._currentlock(repo._wlockref) is None:
                         return
                     # Only weak references are captured by the callback below; it
                     # bails out if either object is gone by the time it runs.
                     reporef = weakref.ref(repo)
                     manifestrevlogref = weakref.ref(self)
                     def persistmanifestcache(success):
                         # Repo is in an unknown state, do not persist.
                         if not success:
                             return
                         repo = reporef()
                         self = manifestrevlogref()
                         if repo is None or self is None:
                             return
                         if repo.manifestlog.getstorage(b'') is not self:
                             # there's a different manifest in play now, abort
                             return
                         self._fulltextcache.write()
                     repo._afterlock(persistmanifestcache)
                 @property
                 def fulltextcache(self):
                     return self._fulltextcache
                 def clearcaches(self, clear_persisted_data=False):
                     """Clear the revlog and fulltext caches and reset the dirlog cache
                     so that it only maps this revlog's own tree to itself.

                     `clear_persisted_data` is passed through to the fulltext cache.
                     """
                     self._revlog.clearcaches()
                     self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)
                     self._dirlogcache = {self.tree: self}
                 def dirlog(self, d):
                     """Return the manifestrevlog for directory `d`, creating it and
                     storing it in the dirlog cache on first use."""
                     if d:
                         assert self._treeondisk
                     if d not in self._dirlogcache:
                         mfrevlog = manifestrevlog(
                             self.opener, d, self._dirlogcache, treemanifest=self._treeondisk
                         )
                         self._dirlogcache[d] = mfrevlog
                     return self._dirlogcache[d]
                 def add(
                     self,
                     m,
                     transaction,
                     link,
                     p1,
                     p2,
                     added,
                     removed,
                     readtree=None,
                     match=None,
                 ):
                     """Store manifest `m` as a new revision and return its node.

                     When the fulltext of `p1` is cached, a delta is computed up-front
                     via ``m.fastdelta()`` from the `added` and `removed` names.
                     Otherwise (or when fastdelta raises FastdeltaUnavailable) the
                     manifest is written through _addtree() for tree manifests, which
                     requires `readtree` and `match`, or as a full text for flat ones.

                     The resulting full text is put in the fulltext cache, except on
                     the tree manifest path.
                     """
                     try:
                         if p1 not in self.fulltextcache:
                             raise FastdeltaUnavailable()
                         # If our first parent is in the manifest cache, we can
                         # compute a delta here using properties we know about the
                         # manifest up-front, which may save time later for the
                         # revlog layer.
                         _checkforbidden(added)
                         # combine the changed lists into one sorted iterator
                         work = heapq.merge(
                             [(x, False) for x in sorted(added)],
                             [(x, True) for x in sorted(removed)],
                         )
                         arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
                         cachedelta = self._revlog.rev(p1), deltatext
                         text = util.buffer(arraytext)
                         n = self._revlog.addrevision(
                             text, transaction, link, p1, p2, cachedelta
                         )
                     except FastdeltaUnavailable:
                         # The first parent manifest isn't already loaded or the
                         # manifest implementation doesn't support fastdelta, so
                         # we'll just encode a fulltext of the manifest and pass
                         # that through to the revlog layer, and let it handle the
                         # delta process.
                         if self._treeondisk:
                             assert readtree, b"readtree must be set for treemanifest writes"
                             assert match, b"match must be specified for treemanifest writes"
                             m1 = readtree(self.tree, p1)
                             m2 = readtree(self.tree, p2)
                             n = self._addtree(
                                 m, transaction, link, m1, m2, readtree, match=match
                             )
                             # No full text is available to cache on this path.
                             arraytext = None
                         else:
                             text = m.text()
                             n = self._revlog.addrevision(text, transaction, link, p1, p2)
                             arraytext = bytearray(text)
                     if arraytext is not None:
                         self.fulltextcache[n] = arraytext
                     return n
                 def _addtree(self, m, transaction, link, m1, m2, readtree, match):
                     """Write tree manifest `m`, including its subtrees, and return its
                     node.

                     `m1` and `m2` are the parent manifests. For a non-root tree no
                     new revision is written when `m` is unmodified relative to a
                     parent, or when its directory text equals that of a parent; the
                     parent's node is used instead. The chosen node is recorded on
                     `m` via setnode().
                     """
                     # If the manifest is unchanged compared to one parent,
                     # don't write a new revision
                     if self.tree != b'' and (
                         m.unmodifiedsince(m1) or m.unmodifiedsince(m2)
                     ):
                         return m.node()
                     def writesubtree(subm, subp1, subp2, match):
                         # `added` and `removed` are passed as None for subtrees.
                         sublog = self.dirlog(subm.dir())
                         sublog.add(
                             subm,
                             transaction,
                             link,
                             subp1,
                             subp2,
                             None,
                             None,
                             readtree=readtree,
                             match=match,
                         )
                     m.writesubtrees(m1, m2, writesubtree, match)
                     text = m.dirtext()
                     n = None
                     if self.tree != b'':
                         # Double-check whether contents are unchanged to one parent
                         if text == m1.dirtext():
                             n = m1.node()
                         elif text == m2.dirtext():
                             n = m2.node()
                     if not n:
                         n = self._revlog.addrevision(
                             text, transaction, link, m1.node(), m2.node()
                         )
                     # Save nodeid so parent manifest can calculate its nodeid
                     m.setnode(n)
                     return n
                 # The methods from here through files() forward straight to the
                 # wrapped revlog.
                 def __len__(self):
                     return len(self._revlog)
                 def __iter__(self):
                     return self._revlog.__iter__()
                 def rev(self, node):
                     return self._revlog.rev(node)
                 def node(self, rev):
                     return self._revlog.node(rev)
                 def lookup(self, value):
                     return self._revlog.lookup(value)
                 def parentrevs(self, rev):
                     return self._revlog.parentrevs(rev)
                 def parents(self, node):
                     return self._revlog.parents(node)
                 def linkrev(self, rev):
                     return self._revlog.linkrev(rev)
                 def checksize(self):
                     return self._revlog.checksize()
                 def revision(self, node, _df=None, raw=False):
                     return self._revlog.revision(node, _df=_df, raw=raw)
                 def rawdata(self, node, _df=None):
                     return self._revlog.rawdata(node, _df=_df)
                 def revdiff(self, rev1, rev2):
                     return self._revlog.revdiff(rev1, rev2)
                 def cmp(self, node, text):
                     return self._revlog.cmp(node, text)
                 def deltaparent(self, rev):
                     return self._revlog.deltaparent(rev)
                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                 ):
                     return self._revlog.emitrevisions(
                         nodes,
                         nodesorder=nodesorder,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         deltamode=deltamode,
                     )
                 def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
                     return self._revlog.addgroup(
                         deltas, linkmapper, transaction, addrevisioncb=addrevisioncb
                     )
                 def rawsize(self, rev):
                     return self._revlog.rawsize(rev)
                 def getstrippoint(self, minlink):
                     return self._revlog.getstrippoint(minlink)
                 def strip(self, minlink, transaction):
                     return self._revlog.strip(minlink, transaction)
                 def files(self):
                     return self._revlog.files()
                 def clone(self, tr, destrevlog, **kwargs):
                     """Clone the wrapped revlog into the revlog wrapped by
                     `destrevlog`.

                     Raises error.ProgrammingError if `destrevlog` is not a
                     manifestrevlog.
                     """
                     if not isinstance(destrevlog, manifestrevlog):
                         raise error.ProgrammingError(b'expected manifestrevlog to clone()')
                     return self._revlog.clone(tr, destrevlog._revlog, **kwargs)
                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     return self._revlog.storageinfo(
                         exclusivefiles=exclusivefiles,
                         sharedfiles=sharedfiles,
                         revisionscount=revisionscount,
                         trackedsize=trackedsize,
                         storedsize=storedsize,
                     )
                 # indexfile and opener are read from, and written to, the wrapped
                 # revlog.
                 @property
                 def indexfile(self):
                     return self._revlog.indexfile
                 @indexfile.setter
                 def indexfile(self, value):
                     self._revlog.indexfile = value
                 @property
                 def opener(self):
                     return self._revlog.opener
                 @opener.setter
                 def opener(self, value):
                     self._revlog.opener = value
             @interfaceutil.implementer(repository.imanifestlog)
             class manifestlog(object):
                 """A collection class representing the collection of manifest snapshots
                 referenced by commits in the repository.

                 In this situation, 'manifest' refers to the abstract concept of a snapshot
                 of the list of files in the given commit. Consumers of the output of this
                 class do not care about the implementation details of the actual manifests
                 they receive (i.e. tree or flat or lazily loaded, etc)."""

                 def __init__(self, opener, repo, rootstore, narrowmatch):
                     options = getattr(opener, 'options', None)
                     if options is None:
                         treemanifests = False
                         cachesize = 4
                     else:
                         treemanifests = options.get(b'treemanifest', False)
                         cachesize = options.get(b'manifestcachesize', 4)

                     self._treemanifests = treemanifests

                     self._rootstore = rootstore
                     self._rootstore._setupmanifestcachehooks(repo)
                     self._narrowmatch = narrowmatch

                     self._cachesize = cachesize
                     # A cache of the manifestctx or treemanifestctx for each directory
                     self._dirmancache = {b'': util.lrucachedict(cachesize)}

                 def __getitem__(self, node):
                     """Retrieves the manifest instance for the given node. Throws a
                     LookupError if not found.
                     """
                     return self.get(b'', node)

                 def get(self, tree, node, verify=True):
                     """Retrieves the manifest instance for the given node. Throws a
                     LookupError if not found.

                     `verify` - if True an exception will be thrown if the node is not in
                                the revlog
                     """
                     cached = self._dirmancache.get(tree, ())
                     if node in cached:
                         return cached[node]

                     # Directories the narrow matcher will not visit get a dedicated
                     # context object, which is not cached.
                     narrow = self._narrowmatch
                     if not narrow.always() and not narrow.visitdir(tree[:-1]):
                         return excludeddirmanifestctx(tree, node)

                     if not tree:
                         if verify:
                             # Side-effect is LookupError is raised if node doesn't
                             # exist.
                             self._rootstore.rev(node)
                         if self._treemanifests:
                             ctx = treemanifestctx(self, b'', node)
                         else:
                             ctx = manifestctx(self, node)
                     elif self._rootstore._treeondisk:
                         if verify:
                             # Side-effect is LookupError is raised if node doesn't
                             # exist.
                             self.getstorage(tree).rev(node)
                         ctx = treemanifestctx(self, tree, node)
                     else:
                         raise error.Abort(
                             _(
                                 b"cannot ask for manifest directory '%s' in a flat "
                                 b"manifest"
                             )
                             % tree
                         )

                     if node != nullid:
                         percache = self._dirmancache.get(tree)
                         if not percache:
                             percache = util.lrucachedict(self._cachesize)
                             self._dirmancache[tree] = percache
                         percache[node] = ctx
                     return ctx

                 def getstorage(self, tree):
                     """Return the storage object for directory `tree`, obtained from
                     the root store."""
                     rootstore = self._rootstore
                     return rootstore.dirlog(tree)

                 def clearcaches(self, clear_persisted_data=False):
                     """Forget every cached manifest context, then clear the root
                     store's caches as well."""
                     self._dirmancache.clear()
                     rootstore = self._rootstore
                     rootstore.clearcaches(clear_persisted_data=clear_persisted_data)

                 def rev(self, node):
                     """Return the revision number of `node` in the root store."""
                     rootstore = self._rootstore
                     return rootstore.rev(node)
             @interfaceutil.implementer(repository.imanifestrevisionwritable)
             class memmanifestctx(object):
                 """A writable manifest revision backed by a manifestdict that is held
                 in memory until write() is called."""

                 def __init__(self, manifestlog):
                     self._manifestlog = manifestlog
                     self._manifestdict = manifestdict()

                 def _storage(self):
                     """Return the storage object for the root (b'') manifest."""
                     mfl = self._manifestlog
                     return mfl.getstorage(b'')

                 def copy(self):
                     """Return a new memmanifestctx on the same manifestlog holding a
                     copy of this one's contents."""
                     duplicate = memmanifestctx(self._manifestlog)
                     duplicate._manifestdict = self.read().copy()
                     return duplicate

                 def read(self):
                     """Return the manifestdict held by this context."""
                     return self._manifestdict

                 def write(self, transaction, link, p1, p2, added, removed, match=None):
                     """Add the held manifest to the root storage and return whatever
                     the storage's add() returns."""
                     storage = self._storage()
                     return storage.add(
                         self._manifestdict,
                         transaction,
                         link,
                         p1,
                         p2,
                         added,
                         removed,
                         match=match,
                     )
             @interfaceutil.implementer(repository.imanifestrevisionstored)
             class manifestctx(object):
                 """A class representing a single revision of a manifest, including its
                 contents, its parent revs, and its linkrev.
                 """
                 def __init__(self, manifestlog, node):
                     self._node = node
                     self._manifestlog = manifestlog
                     # Parsed manifest contents; stays None until read() fills it in.
                     self._data = None

                     # TODO: We eventually want p1, p2, and linkrev exposed on this class,
                     # but let's add it later when something needs it and we can load it
                     # lazily.
                     # self.p1, self.p2 = store.parents(node)
                     # rev = store.rev(node)
                     # self.linkrev = store.linkrev(rev)
                 def _storage(self):
                     """Return the storage object for the root (b'') manifest."""
                     mfl = self._manifestlog
                     return mfl.getstorage(b'')
                 def node(self):
                     """Return the node this manifest revision was constructed with."""
                     return self._node
                 def copy(self):
                     """Return a memmanifestctx on the same manifestlog that holds a
                     copy of this revision's contents."""
                     duplicate = memmanifestctx(self._manifestlog)
                     duplicate._manifestdict = self.read().copy()
                     return duplicate
                 @propertycache
                 def parents(self):
                     """Parents of this revision's node, as reported by the storage."""
                     store = self._storage()
                     return store.parents(self._node)
                 def read(self):
                     if self._data is None:
                         if self._node == nullid:
                             self._data = manifestdict()
                         else:
                             store = self._storage()
                             if self._node in store.fulltextcache:
                                 text = pycompat.bytestr(store.fulltextcache[self._node])
                             else:
                                 text = store.revision(self._node)
                                 arraytext = bytearray(text)
                                 store.fulltextcache[self._node] = arraytext
                             self._data = manifestdict(text)
                     return self._data
                 def readfast(self, shallow=False):
                     '''Calls either readdelta or read, based on which would be less work.
                     readdelta is called if the delta is against the p1, and therefore can be
                     read quickly.
                     If `shallow` is True, nothing changes since this is a flat manifest.
                     '''
                     store = self._storage()
                     r = store.rev(self._node)
                     deltaparent = store.deltaparent(r)
                     if deltaparent != nullrev and deltaparent in store.parentrevs(r):
                         return self.readdelta()
                     return self.read()
                 def readdelta(self, shallow=False):
                     '''Returns a manifest containing just the entries that are present
                     in this manifest, but not in its p1 manifest. This is efficient to read
                     if the revlog delta is already p1.
                     Changing the value of `shallow` has no effect on flat manifests.
                     '''
                     store = self._storage()
                     r = store.rev(self._node)
                     d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))
                     return manifestdict(d)
                 def find(self, key):
                     return self.read().find(key)
             @interfaceutil.implementer(repository.imanifestrevisionwritable)
             class memtreemanifestctx(object):
                 """In-memory, writable context wrapping a treemanifest."""

                 def __init__(self, manifestlog, dir=b''):
                     self._dir = dir
                     self._manifestlog = manifestlog
                     # Starts out as an empty tree; copy() replaces it on clones.
                     self._treemanifest = treemanifest()

                 def _storage(self):
                     """Return the storage object for the root (``b''``) manifest."""
                     return self._manifestlog.getstorage(b'')

                 def copy(self):
                     """Return a new context for the same dir with a copied tree."""
                     clone = memtreemanifestctx(self._manifestlog, dir=self._dir)
                     clone._treemanifest = self._treemanifest.copy()
                     return clone

                 def read(self):
                     """Return the treemanifest held by this context (not a copy)."""
                     return self._treemanifest

                 def write(self, transaction, link, p1, p2, added, removed, match=None):
                     """Hand the in-memory tree to the backing storage.

                     All arguments are forwarded unchanged to the storage object's
                     ``add()``, together with a ``readtree`` callback that loads a
                     (dir, node) manifest through the manifestlog.
                     """

                     def readtree(dir, node):
                         subctx = self._manifestlog.get(dir, node)
                         return subctx.read()

                     store = self._storage()
                     return store.add(
                         self._treemanifest,
                         transaction,
                         link,
                         p1,
                         p2,
                         added,
                         removed,
                         readtree=readtree,
                         match=match,
                     )
             @interfaceutil.implementer(repository.imanifestrevisionstored)
             class treemanifestctx(object):
                 """Context object for one stored revision of a tree manifest directory.

                 The manifest contents are loaded on the first ``read()`` and kept on
                 the instance for subsequent calls.
                 """

                 def __init__(self, manifestlog, dir, node):
                     self._dir = dir
                     self._node = node
                     self._manifestlog = manifestlog
                     # Loaded treemanifest; filled in by the first read().
                     self._data = None

                     # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so that
                     # we can instantiate treemanifestctx objects for directories we don't
                     # have on disk.
                     # self.p1, self.p2 = store.parents(node)
                     # rev = store.rev(node)
                     # self.linkrev = store.linkrev(rev)

                 def _storage(self):
                     """Return the storage for this directory.

                     When the manifestlog's narrow matcher is not an "always" matcher
                     and refuses to visit this directory, an excludedmanifestrevlog
                     stand-in is returned instead of the real storage.
                     """
                     mfl = self._manifestlog
                     matcher = mfl._narrowmatch
                     # visitdir() is given the directory without its last character.
                     excluded = not matcher.always() and not matcher.visitdir(
                         self._dir[:-1]
                     )
                     if excluded:
                         return excludedmanifestrevlog(self._dir)
                     return mfl.getstorage(self._dir)

                 def read(self):
                     """Return the treemanifest for this revision, loading it on demand.

                     The null node yields an empty treemanifest. If the storage keeps
                     trees on disk, the tree is read through callbacks that fetch this
                     revision's text and load subtrees via the manifestlog. Otherwise
                     the full text is parsed directly, going through the storage's
                     ``fulltextcache``.
                     """
                     if self._data is not None:
                         return self._data

                     store = self._storage()
                     node = self._node
                     if node == nullid:
                         tree = treemanifest()
                     # TODO accessing non-public API
                     elif store._treeondisk:
                         tree = treemanifest(dir=self._dir)

                         def gettext():
                             return store.revision(self._node)

                         def readsubtree(dir, subm):
                             # Set verify to False since we need to be able to create
                             # subtrees for trees that don't exist on disk.
                             subctx = self._manifestlog.get(dir, subm, verify=False)
                             return subctx.read()

                         tree.read(gettext, readsubtree)
                         tree.setnode(node)
                     else:
                         if node in store.fulltextcache:
                             text = pycompat.bytestr(store.fulltextcache[node])
                         else:
                             text = store.revision(node)
                             # Keep the full text around for later readers.
                             store.fulltextcache[node] = bytearray(text)
                         tree = treemanifest(dir=self._dir, text=text)

                     self._data = tree
                     return tree

                 def node(self):
                     """Return the node this context was created for."""
                     return self._node

                 def copy(self):
                     """Return a memtreemanifestctx holding a copy of this tree."""
                     clone = memtreemanifestctx(self._manifestlog, dir=self._dir)
                     clone._treemanifest = self.read().copy()
                     return clone

                 @propertycache
                 def parents(self):
                     """Parents of this node as reported by the storage (cached)."""
                     return self._storage().parents(self._node)

                 def readdelta(self, shallow=False):
                     '''Return the entries of this manifest that differ from its
                     delta parent.

                     If `shallow` is True, only the stored delta for this directory is
                     parsed, without recursively reading subdirectory manifests. Any
                     subdirectory entry is then reported as it appears in the manifest,
                     i.e. among the files and distinguished only by its 't' flag.

                     Otherwise both the delta parent manifest and this manifest are
                     fully read and diffed, and a treemanifest is built from every
                     entry that has a node on this side of the diff.
                     '''
                     store = self._storage()
                     if shallow:
                         rev = store.rev(self._node)
                         delta = store.revdiff(store.deltaparent(rev), rev)
                         return manifestdict(mdiff.patchtext(delta))

                     # Need to perform a slow delta
                     baserev = store.deltaparent(store.rev(self._node))
                     basectx = self._manifestlog.get(self._dir, store.node(baserev))
                     base = basectx.read()
                     current = self.read()
                     result = treemanifest(dir=self._dir)
                     changes = base.diff(current)
                     for path, ((_n0, _fl0), (newnode, newflag)) in pycompat.iteritems(
                         changes
                     ):
                         if not newnode:
                             # No node on this side of the diff: nothing to record.
                             continue
                         result[path] = newnode
                         if newflag:
                             result.setflag(path, newflag)
                     return result

                 def readfast(self, shallow=False):
                     '''Pick between readdelta() and a full read.

                     readdelta() is used when the stored delta parent is not the null
                     revision and is one of this revision's parents.

                     Otherwise, with `shallow` set, only this directory's own text is
                     parsed (as a manifestdict, without submanifests); without it the
                     full read() result is returned.
                     '''
                     store = self._storage()
                     rev = store.rev(self._node)
                     base = store.deltaparent(rev)
                     if base != nullrev and base in store.parentrevs(rev):
                         return self.readdelta(shallow=shallow)
                     if not shallow:
                         return self.read()
                     return manifestdict(store.revision(self._node))

                 def find(self, key):
                     """Delegate to ``find(key)`` on the fully read manifest."""
                     manifest = self.read()
                     return manifest.find(key)
             class excludeddir(treemanifest):
                 """Placeholder tree for a directory excluded from the repository.

                 When narrowing is active on a treemanifest repository, some
                 directory revlogs are left out of the clone. That saves a lot of
                 storage on clients, but internals still need some pseudo-manifest
                 so that a merge conflict outside the narrowspec can be detected.
                 This class fills that role: it represents a directory whose node
                 is known while its contents are not.
                 """

                 def __init__(self, dir, node):
                     super(excludeddir, self).__init__(dir)
                     self._node = node
                     # Register one entry with an empty name. Iterators and the like
                     # will include it, so it shows up as the directory itself
                     # (i.e. something like "dir/").
                     placeholder = b''
                     self._files[placeholder] = node
                     self._flags[placeholder] = b't'

                 def copy(self):
                     """Return ``self`` rather than a new object.

                     Manifests outside the narrowspec should never be modified, so
                     copying is avoided; this makes a noticeable difference when
                     there are very many directories outside the narrowspec. It also
                     keeps the "copy" the same type as the original, which the super
                     type's copy() would not.
                     """
                     return self
             class excludeddirmanifestctx(treemanifestctx):
                 """context wrapper for excludeddir - see that docstring for rationale

                 Instances carry only a directory name and a node. The parent
                 initializer is deliberately not called, so there is no manifestlog
                 (and therefore no backing storage) behind this context.
                 """

                 def __init__(self, dir, node):
                     self._dir = dir
                     self._node = node

                 def read(self):
                     """Return a fresh excludeddir stand-in for this (dir, node)."""
                     return excludeddir(self._dir, self._node)

                 def readfast(self, shallow=False):
                     """Return the same stand-in as read().

                     The inherited readfast() goes through ``self._storage()``, which
                     needs ``self._manifestlog``. This class never sets that
                     attribute, so the inherited version would fail with
                     AttributeError. There is no underlying storage to consult, so
                     read() is the only meaningful answer; `shallow` is ignored.
                     """
                     return self.read()

                 def write(self, *args, **kwargs):
                     """Always raise: excluded directories must never be written.

                     Keyword arguments are accepted as well (the writable contexts
                     take ``match=...``) so that any write attempt reports the
                     ProgrammingError below instead of a TypeError.

                     Raises:
                         error.ProgrammingError: unconditionally.
                     """
                     raise error.ProgrammingError(
                         b'attempt to write manifest from excluded dir %s' % self._dir
                     )
             class excludedmanifestrevlog(manifestrevlog):
                 """Placeholder revlog for treemanifest directories that are excluded.

                 With narrowing active on a treemanifest repository, some
                 directories are referenced even though their revlog was skipped
                 and cannot be seen. This class conforms to the manifestrevlog
                 interface for those directories and proactively prevents writes
                 outside the narrowspec.
                 """

                 def __init__(self, dir):
                     # Only the directory name is stored; the base-class initializer
                     # is not invoked.
                     self._dir = dir

                 def __len__(self):
                     """Always raise error.ProgrammingError."""
                     msg = b'attempt to get length of excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)

                 def rev(self, node):
                     """Always raise error.ProgrammingError."""
                     msg = b'attempt to get rev from excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)

                 def linkrev(self, node):
                     """Always raise error.ProgrammingError."""
                     msg = b'attempt to get linkrev from excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)

                 def node(self, rev):
                     """Always raise error.ProgrammingError."""
                     msg = b'attempt to get node from excluded dir %s' % self._dir
                     raise error.ProgrammingError(msg)

                 def add(self, *args, **kwargs):
                     """Accept any arguments and do nothing.

                     We should never write entries in dirlogs outside the narrow
                     clone. However, the method still gets called from writesubtree()
                     in _addtree(), so we need to handle it. We should possibly make
                     that avoid calling add() with a clean manifest (_dirty is always
                     False in excludeddir instances).
                     """
                     return None