upstream/mercurial-mirror Commit - r52657:2f88df88

1

# manifest.py - manifest revision class for mercurial

1

# manifest.py - manifest revision class for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

9

import heapq

9

import heapq

10

import itertools

10

import itertools

11

import struct

11

import struct

12

import weakref

12

import weakref

13

14

from .i18n import _

14

from .i18n import _

15

from .node import (

15

from .node import (

16

bin,

16

bin,

17

hex,

17

hex,

18

nullrev,

18

nullrev,

19

)

19

)

20

from . import (

20

from . import (

21

encoding,

21

encoding,

22

error,

22

error,

23

match as matchmod,

23

match as matchmod,

24

mdiff,

24

mdiff,

25

pathutil,

25

pathutil,

26

policy,

26

policy,

27

pycompat,

27

pycompat,

28

revlog,

28

revlog,

29

util,

29

util,

30

)

30

)

31

from .interfaces import (

31

from .interfaces import (

32

repository,

32

repository,

33

util as interfaceutil,

33

util as interfaceutil,

34

)

34

)

35

from .revlogutils import (

35

from .revlogutils import (

36

constants as revlog_constants,

36

constants as revlog_constants,

37

)

37

)

38

39

parsers = policy.importmod('parsers')

39

parsers = policy.importmod('parsers')

40

propertycache = util.propertycache

40

propertycache = util.propertycache

41

42

# Allow tests to more easily test the alternate path in manifestdict.fastdelta()

42

# Allow tests to more easily test the alternate path in manifestdict.fastdelta()

43

FASTDELTA_TEXTDIFF_THRESHOLD = 1000

43

FASTDELTA_TEXTDIFF_THRESHOLD = 1000

44

45

46

def _parse(nodelen, data):
    """Yield ``(filename, binary node, flags)`` for each line of ``data``.

    ``data`` is manifest text: one ``<filename>\\0<hex node>[<flag>]`` entry
    per line.  ``nodelen`` is the expected length of the binary node, so the
    hex portion of every line must be ``2 * nodelen`` characters long.

    Raises ValueError when non-empty data does not end in a newline, when the
    lines are not in sorted order, or when the hex portion of a line has the
    wrong length.
    """
    # The precondition checks below look excessive on purpose: the behavior
    # of the pure version is meant to exactly match its C counterpart, to
    # help prevent surprise breakage for anyone that develops against the
    # pure version.
    if data and data[-1:] != b'\n':
        raise ValueError(b'Manifest did not end in a newline.')

    previous = None
    for line in data.splitlines():
        # Whole lines are compared, not just the filename part.
        if previous is not None and line < previous:
            raise ValueError(b'Manifest lines not in sorted order.')
        previous = line

        name, rest = line.split(b'\0')
        hexlen = len(rest)
        flags = rest[-1:]
        if flags not in _manifestflags:
            # The last character belongs to the hex node: no flag present.
            flags = b''
        else:
            # Strip the trailing flag from the hex node.
            rest = rest[:-1]
            hexlen -= 1
        if hexlen != 2 * nodelen:
            raise ValueError(b'Invalid manifest line')

        yield name, bin(rest), flags

71

72

73

def _text(it):
    """Serialize ``(filename, node, flags)`` triples into manifest text.

    Every filename seen is passed to ``_checkforbidden`` once the whole
    iterable has been consumed; the joined lines are returned afterwards.
    """
    names = []
    chunks = []
    for name, node, flags in it:
        names.append(name)
        # if this is changed to support newlines in filenames,
        # be sure to check the templates/ dir again (especially *-raw.tmpl)
        entry = b"%s\0%s%s\n" % (name, hex(node), flags)
        chunks.append(entry)

    _checkforbidden(names)
    return b''.join(chunks)

84

85

86

class lazymanifestiter:
    """Iterator over the filenames of a lazy manifest.

    ``lm`` must provide ``_get(index)`` returning ``(data, pos)``: either the
    backing byte string with a non-negative offset, or an entry tuple with
    ``pos == -1``.  ``_get`` signals the end by raising IndexError.
    """

    def __init__(self, lm):
        self.pos = 0
        self.lm = lm

    def __iter__(self):
        return self

    def next(self):
        try:
            data, offset = self.lm._get(self.pos)
        except IndexError:
            raise StopIteration
        # Both kinds of entry advance the cursor by one.
        self.pos += 1
        if offset == -1:
            # Entry tuple: the filename is its first element.
            return data[0]
        # Entry inside the byte string: the filename runs up to the NUL.
        nul = data.find(b'\x00', offset)
        return data[offset:nul]

    __next__ = next

107

108

109

class lazymanifestiterentries:
    """Iterator over ``(filename, node, flags)`` entries of a lazy manifest.

    ``lm`` must provide ``_get(index)``, ``_nodelen`` and ``extrainfo``.
    Entries stored as tuples (``pos == -1``) are returned as-is; entries
    stored in the byte string are parsed on the fly.
    """

    def __init__(self, lm):
        self.lm = lm
        self.pos = 0

    def __iter__(self):
        return self

    def next(self):
        try:
            data, start = self.lm._get(self.pos)
        except IndexError:
            raise StopIteration

        if start == -1:
            # Already a (filename, node, flags) tuple.
            self.pos += 1
            return data

        nul = data.find(b'\x00', start)
        eol = data.find(b'\n', start)
        if nul == -1 or eol == -1 or eol < nul:
            raise error.StorageError(b'Invalid manifest line')

        # The byte before the newline is either a flag or the last hex digit.
        flags = data[eol - 1 : eol]
        hexlen = eol - nul - 1
        if flags in _manifestflags:
            hexlen -= 1
        else:
            flags = b''
        if hexlen != 2 * self.lm._nodelen:
            raise error.StorageError(b'Invalid manifest line')

        node = unhexlify(data, self.lm.extrainfo[self.pos], nul + 1, hexlen)
        # The cursor only advances once the entry was decoded successfully.
        self.pos += 1
        return (data[start:nul], node, flags)

    __next__ = next

144

145

146

def unhexlify(data: bytes, extra: int, pos, length: int):
    """Decode ``length`` hex characters of ``data`` starting at ``pos``.

    When ``extra`` is non-zero, its low byte is appended to the decoded
    value as one additional byte.
    """
    node = bin(data[pos : pos + length])
    if extra:
        # bytes([...]) and not chr(...): chr() returns str, which cannot be
        # concatenated to bytes.
        node += bytes([extra & 0xFF])
    return node

151

152

153

def _cmp(a, b):
    """Three-way comparison: 1 if ``a > b``, -1 if ``a < b``, else 0."""
    greater = a > b
    less = a < b
    return greater - less

155

156

157

_manifestflags = {b'', b'l', b't', b'x'}

157

_manifestflags = {b'', b'l', b't', b'x'}

158

159

160

class _lazymanifest:
    """A pure python manifest backed by a byte string.  It is supplemented with
    internal lists as it is modified, until it is compacted back to a pure byte
    string.

    ``data`` is the initial manifest data.

    ``positions`` is a list of offsets, one per manifest entry.  Positive
    values are offsets into ``data``, negative values are offsets into the
    ``extradata`` list.  When an entry is removed, its entry is dropped from
    ``positions``.  The values are encoded such that when walking the list and
    indexing into ``data`` or ``extradata`` as appropriate, the entries are
    sorted by filename.

    ``extrainfo`` is a list of ints parallel to ``positions``.  A non-zero
    value is handed to ``unhexlify`` as the extra byte when the entry's hash
    is decoded from ``data``.

    ``extradata`` is a list of (key, hash, flags) for entries that were added or
    modified since the manifest was created or compacted.
    """

    def __init__(
        self,
        nodelen,
        data,
        positions=None,
        extrainfo=None,
        extradata=None,
        hasremovals=False,
    ):
        """Build a manifest from ``data``.

        When ``positions`` is None the line offsets are computed from
        ``data`` and the other optional arguments are ignored.  Otherwise
        ``positions``, ``extrainfo`` and ``extradata`` are shallow-copied and
        used as the initial state (this is how ``copy()`` works).
        """
        self._nodelen = nodelen
        if positions is None:
            self.positions = self.findlines(data)
            self.extrainfo = [0] * len(self.positions)
            self.data = data
            self.extradata = []
            self.hasremovals = False
        else:
            self.positions = positions[:]
            self.extrainfo = extrainfo[:]
            self.extradata = extradata[:]
            self.data = data
            self.hasremovals = hasremovals

    def findlines(self, data):
        """Return the start offset of every line in ``data``.

        Raises ValueError if non-empty data does not end in a newline or if
        the filenames are not in sorted order.
        """
        if not data:
            return []
        pos = data.find(b"\n")
        if pos == -1 or data[-1:] != b'\n':
            raise ValueError(b"Manifest did not end in a newline.")
        positions = [0]
        prev = data[: data.find(b'\x00')]
        # ``pos`` is always the offset of a newline; stop at the final one.
        while pos < len(data) - 1 and pos != -1:
            positions.append(pos + 1)
            nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]
            if nexts < prev:
                raise ValueError(b"Manifest lines not in sorted order.")
            prev = nexts
            pos = data.find(b"\n", pos + 1)
        return positions

    def _get(self, index):
        """Return ``(data, pos)`` for the entry at ``index``.

        For an entry stored in the byte string this is ``(self.data,
        offset)``; for an added/modified entry it is ``(entry tuple, -1)``.
        Raises IndexError when ``index`` is past the end of ``positions``.
        """
        # get the position encoded in pos:
        #   positive number is an index in 'data'
        #   negative number is in extradata
        pos = self.positions[index]
        if pos >= 0:
            return self.data, pos
        return self.extradata[-pos - 1], -1

    def _getkey(self, pos):
        """Return the filename for an encoded position (see ``_get``)."""
        if pos >= 0:
            return self.data[pos : self.data.find(b'\x00', pos + 1)]
        return self.extradata[-pos - 1][0]

    def bsearch(self, key):
        """Return the index of ``key`` in ``positions``, or -1 if absent."""
        first = 0
        last = len(self.positions) - 1

        while first <= last:
            midpoint = (first + last) // 2
            nextpos = self.positions[midpoint]
            candidate = self._getkey(nextpos)
            r = _cmp(key, candidate)
            if r == 0:
                return midpoint
            if r < 0:
                last = midpoint - 1
            else:
                first = midpoint + 1
        return -1

    def bsearch2(self, key):
        """Return ``(index, found)`` for ``key``.

        When ``key`` is absent, ``index`` is where it would have to be
        inserted to keep ``positions`` sorted.
        """
        # same as the above, but will always return the position
        # done for performance reasons
        first = 0
        last = len(self.positions) - 1

        while first <= last:
            midpoint = (first + last) // 2
            nextpos = self.positions[midpoint]
            candidate = self._getkey(nextpos)
            r = _cmp(key, candidate)
            if r == 0:
                return (midpoint, True)
            if r < 0:
                last = midpoint - 1
            else:
                first = midpoint + 1
        return (first, False)

    def __contains__(self, key):
        return self.bsearch(key) != -1

    def __getitem__(self, key):
        """Return ``(hash, flags)`` for ``key``.

        Raises TypeError for a non-bytes key, KeyError when the key is
        absent, and error.StorageError when the stored line is malformed.
        """
        if not isinstance(key, bytes):
            raise TypeError(b"getitem: manifest keys must be a bytes.")
        needle = self.bsearch(key)
        if needle == -1:
            raise KeyError
        data, pos = self._get(needle)
        if pos == -1:
            # Added/modified entry: (key, hash, flags) tuple.
            return (data[1], data[2])
        zeropos = data.find(b'\x00', pos)
        nlpos = data.find(b'\n', zeropos)
        assert 0 <= needle <= len(self.positions)
        assert len(self.extrainfo) == len(self.positions)
        if zeropos == -1 or nlpos == -1 or nlpos < zeropos:
            raise error.StorageError(b'Invalid manifest line')
        hlen = nlpos - zeropos - 1
        # The byte before the newline is either a flag or the last hex digit.
        flags = data[nlpos - 1 : nlpos]
        if flags in _manifestflags:
            hlen -= 1
        else:
            flags = b''
        if hlen != 2 * self._nodelen:
            raise error.StorageError(b'Invalid manifest line')
        hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)
        return (hashval, flags)

    def __delitem__(self, key):
        """Remove ``key``; raises KeyError when it is absent."""
        needle, found = self.bsearch2(key)
        if not found:
            raise KeyError
        cur = self.positions[needle]
        self.positions = self.positions[:needle] + self.positions[needle + 1 :]
        self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]
        if cur >= 0:
            # Mark the removed line by overwriting its first byte with NUL so
            # that _compact() can detect and drop it.
            # This does NOT unsort the list as far as the search functions are
            # concerned, as they only examine lines mapped by self.positions.
            self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]
            self.hasremovals = True

    def __setitem__(self, key, value):
        """Set ``key`` to ``value``, a ``(node, flags)`` tuple.

        Raises TypeError when the key is not bytes, the value is not a
        2-tuple, the node is not a 20- or 32-byte byte string, or flags is
        not a byte string of at most one byte.
        """
        if not isinstance(key, bytes):
            raise TypeError(b"setitem: manifest keys must be a byte string.")
        if not isinstance(value, tuple) or len(value) != 2:
            raise TypeError(
                b"Manifest values must be a tuple of (node, flags)."
            )
        hashval = value[0]
        if not isinstance(hashval, bytes) or len(hashval) not in (20, 32):
            raise TypeError(b"node must be a 20-byte or 32-byte byte string")
        flags = value[1]
        if not isinstance(flags, bytes) or len(flags) > 1:
            # Interpolate the offending value into the message; passing it
            # as a second exception argument left the %r unformatted.
            raise TypeError(
                b"flags must a 0 or 1 byte string, got %r" % (flags,)
            )
        needle, found = self.bsearch2(key)
        if found:
            # put the item
            pos = self.positions[needle]
            if pos < 0:
                self.extradata[-pos - 1] = (key, hashval, flags)
            else:
                # just don't bother rewriting the byte string: shadow the
                # entry with a new extradata record
                self.extradata.append((key, hashval, flags))
                self.positions[needle] = -len(self.extradata)
        else:
            # not found, put it in with extra positions
            self.extradata.append((key, hashval, flags))
            self.positions = (
                self.positions[:needle]
                + [-len(self.extradata)]
                + self.positions[needle:]
            )
            self.extrainfo = (
                self.extrainfo[:needle] + [0] + self.extrainfo[needle:]
            )

    def copy(self):
        """Return a new manifest sharing ``data`` but with copied lists."""
        # XXX call _compact like in C?
        return _lazymanifest(
            self._nodelen,
            self.data,
            self.positions,
            self.extrainfo,
            self.extradata,
            self.hasremovals,
        )

    def _compact(self):
        """Fold ``extradata`` and removals back into a single byte string.

        Afterwards every value in ``positions`` is an offset into the new
        ``data``, ``extradata`` is empty and ``hasremovals`` is False.
        """
        # hopefully not called TOO often
        if len(self.extradata) == 0 and not self.hasremovals:
            return
        l = []
        i = 0
        offset = 0
        self.extrainfo = [0] * len(self.positions)
        while i < len(self.positions):
            if self.positions[i] >= 0:
                cur = self.positions[i]
                last_cut = cur

                # Collect all contiguous entries in the buffer at the current
                # offset, breaking out only for added/modified items held in
                # extradata, or a deleted line prior to the next position.
                while True:
                    self.positions[i] = offset
                    i += 1
                    if i == len(self.positions) or self.positions[i] < 0:
                        break

                    # A removed file has no positions[] entry, but does have an
                    # overwritten first byte.  Break out and find the end of the
                    # current good entry/entries if there is a removed file
                    # before the next position.
                    if (
                        self.hasremovals
                        and self.data.find(b'\n\x00', cur, self.positions[i])
                        != -1
                    ):
                        break

                    offset += self.positions[i] - cur
                    cur = self.positions[i]
                end_cut = self.data.find(b'\n', cur)
                if end_cut != -1:
                    end_cut += 1
                offset += end_cut - cur
                l.append(self.data[last_cut:end_cut])
            else:
                while i < len(self.positions) and self.positions[i] < 0:
                    cur = self.positions[i]
                    t = self.extradata[-cur - 1]
                    l.append(self._pack(t))
                    self.positions[i] = offset
                    # Hashes are either 20 bytes (old sha1s) or 32
                    # bytes (new non-sha1).
                    hlen = 20
                    if len(t[1]) > 25:
                        hlen = 32
                    if len(t[1]) > hlen:
                        # Indexing bytes already yields an int, so no ord().
                        # NOTE(review): _pack() asserts a 20/32-byte hash, so
                        # this branch looks unreachable with asserts enabled;
                        # also confirm whether the index should be ``hlen``
                        # rather than ``hlen + 1``.
                        self.extrainfo[i] = t[1][hlen + 1]
                    offset += len(l[-1])
                    i += 1
        self.data = b''.join(l)
        self.hasremovals = False
        self.extradata = []

    def _pack(self, d):
        """Serialize a (key, hash, flags) tuple into one manifest line."""
        n = d[1]
        assert len(n) in (20, 32)
        return d[0] + b'\x00' + hex(n) + d[2] + b'\n'

    def text(self):
        """Return the manifest as a byte string, compacting first."""
        self._compact()
        return self.data

    def diff(self, m2, clean=False):
        '''Finds changes between the current manifest and m2.

        Returns a dict mapping filename to ``((hash1, flags1), (hash2,
        flags2))``, with ``(None, b'')`` standing in for the side where the
        file is absent.  When ``clean`` is true, unchanged files are included
        with a None value.
        '''
        # XXX think whether efficiency matters here
        diff = {}

        for fn, e1, flags in self.iterentries():
            if fn not in m2:
                diff[fn] = (e1, flags), (None, b'')
            else:
                e2 = m2[fn]
                if (e1, flags) != e2:
                    diff[fn] = (e1, flags), e2
                elif clean:
                    diff[fn] = None

        for fn, e2, flags in m2.iterentries():
            if fn not in self:
                diff[fn] = (None, b''), (e2, flags)

        return diff

    def iterentries(self):
        """Iterate over (filename, hash, flags) tuples."""
        return lazymanifestiterentries(self)

    def iterkeys(self):
        """Iterate over filenames."""
        return lazymanifestiter(self)

    def __iter__(self):
        return lazymanifestiter(self)

    def __len__(self):
        return len(self.positions)

    def filtercopy(self, filterfn):
        """Return a new manifest holding the entries ``filterfn`` accepts."""
        # XXX should be optimized
        c = _lazymanifest(self._nodelen, b'')
        for f, n, fl in self.iterentries():
            if filterfn(f):
                c[f] = n, fl
        return c

466

467

468

# Rebind _lazymanifest to the implementation exposed by the loaded parsers
# module; when that module has no ``lazymanifest`` attribute, the pure Python
# class defined in this file stays in place.
try:
    _lazymanifest = parsers.lazymanifest
except AttributeError:
    pass

472

473

474

@interfaceutil.implementer(repository.imanifestdict)

474

@interfaceutil.implementer(repository.imanifestdict)

475

class manifestdict:

475

class manifestdict:

476

def __init__(self, nodelen, data=b''):

476

def __init__(self, nodelen, data=b''):

477

self._nodelen = nodelen

477

self._nodelen = nodelen

478

self._lm = _lazymanifest(nodelen, data)

478

self._lm = _lazymanifest(nodelen, data)

479

480

def __getitem__(self, key):

480

def __getitem__(self, key):

481

return self._lm[key][0]

481

return self._lm[key][0]

482

483

def find(self, key):

483

def find(self, key):

484

return self._lm[key]

484

return self._lm[key]

485

486

def __len__(self):

486

def __len__(self):

487

return len(self._lm)

487

return len(self._lm)

488

489

def __nonzero__(self):

489

def __nonzero__(self):

490

# nonzero is covered by the __len__ function, but implementing it here

490

# nonzero is covered by the __len__ function, but implementing it here

491

# makes it easier for extensions to override.

491

# makes it easier for extensions to override.

492

return len(self._lm) != 0

492

return len(self._lm) != 0

493

494

__bool__ = __nonzero__

494

__bool__ = __nonzero__

495

496

def set(self, key, node, flags):

496

def set(self, key, node, flags):

497

self._lm[key] = node, flags

497

self._lm[key] = node, flags

498

499

def __setitem__(self, key, node):

499

def __setitem__(self, key, node):

500

self._lm[key] = node, self.flags(key)

500

self._lm[key] = node, self.flags(key)

501

502

def __contains__(self, key):

502

def __contains__(self, key):

503

if key is None:

503

if key is None:

504

return False

504

return False

505

return key in self._lm

505

return key in self._lm

506

507

def __delitem__(self, key):

507

def __delitem__(self, key):

508

del self._lm[key]

508

del self._lm[key]

509

510

def __iter__(self):

510

def __iter__(self):

511

return self._lm.__iter__()

511

return self._lm.__iter__()

512

513

def iterkeys(self):

513

def iterkeys(self):

514

return self._lm.iterkeys()

514

return self._lm.iterkeys()

515

516

def keys(self):

516

def keys(self):

517

return list(self.iterkeys())

517

return list(self.iterkeys())

518

519

def filesnotin(self, m2, match=None):

519

def filesnotin(self, m2, match=None):

520

'''Set of files in this manifest that are not in the other'''

520

'''Set of files in this manifest that are not in the other'''

521

if match is not None:

521

if match is not None:

522

match = matchmod.badmatch(match, lambda path, msg: None)

522

match = matchmod.badmatch(match, lambda path, msg: None)

523

sm2 = set(m2.walk(match))

523

sm2 = set(m2.walk(match))

524

return {f for f in self.walk(match) if f not in sm2}

524

return {f for f in self.walk(match) if f not in sm2}

525

return {f for f in self if f not in m2}

525

return {f for f in self if f not in m2}

526

527

@propertycache

527

@propertycache

528

def _dirs(self):

528

def _dirs(self):

529

return pathutil.dirs(self)

529

return pathutil.dirs(self)

530

531

def dirs(self):

531

def dirs(self):

532

return self._dirs

532

return self._dirs

533

534

def hasdir(self, dir):

534

def hasdir(self, dir):

535

return dir in self._dirs

535

return dir in self._dirs

536

537

def _filesfastpath(self, match):

537

def _filesfastpath(self, match):

538

"""Checks whether we can correctly and quickly iterate over matcher

538

"""Checks whether we can correctly and quickly iterate over matcher

539

files instead of over manifest files."""

539

files instead of over manifest files."""

540

files = match.files()

540

files = match.files()

541

return len(files) < 100 and (

541

return len(files) < 100 and (

542

match.isexact()

542

match.isexact()

543

or (match.prefix() and all(fn in self for fn in files))

543

or (match.prefix() and all(fn in self for fn in files))

544

)

544

)

545

546

def walk(self, match):

546

def walk(self, match):

547

"""Generates matching file names.

547

"""Generates matching file names.

548

549

Equivalent to manifest.matches(match).iterkeys(), but without creating

549

Equivalent to manifest.matches(match).iterkeys(), but without creating

550

an entirely new manifest.

550

an entirely new manifest.

551

552

It also reports nonexistent files by marking them bad with match.bad().

552

It also reports nonexistent files by marking them bad with match.bad().

553

"""

553

"""

554

if match.always():

554

if match.always():

555

for f in iter(self):

555

for f in iter(self):

556

yield f

556

yield f

557

return

557

return

558

559

fset = set(match.files())

559

fset = set(match.files())

560

561

# avoid the entire walk if we're only looking for specific files

561

# avoid the entire walk if we're only looking for specific files

562

if self._filesfastpath(match):

562

if self._filesfastpath(match):

563

for fn in sorted(fset):

563

for fn in sorted(fset):

564

if fn in self:

564

if fn in self:

565

yield fn

565

yield fn

566

return

566

return

567

568

for fn in self:

568

for fn in self:

569

if fn in fset:

569

if fn in fset:

570

# specified pattern is the exact name

570

# specified pattern is the exact name

571

fset.remove(fn)

571

fset.remove(fn)

572

if match(fn):

572

if match(fn):

573

yield fn

573

yield fn

574

575

# for dirstate.walk, files=[''] means "walk the whole tree".

575

# for dirstate.walk, files=[''] means "walk the whole tree".

576

# follow that here, too

576

# follow that here, too

577

fset.discard(b'')

577

fset.discard(b'')

578

579

for fn in sorted(fset):

579

for fn in sorted(fset):

580

if not self.hasdir(fn):

580

if not self.hasdir(fn):

581

match.bad(fn, None)

581

match.bad(fn, None)

582

583

def _matches(self, match):
    '''build a new manifest containing only the entries selected by match'''
    if match.always():
        return self.copy()

    filtered = manifestdict(self._nodelen)
    if not self._filesfastpath(match):
        # general case: let the underlying manifest do the filtering
        filtered._lm = self._lm.filtercopy(match)
        return filtered

    # explicit file list: copy across only the entries that exist here
    source = self._lm
    target = filtered._lm
    for fn in match.files():
        if fn in source:
            target[fn] = source[fn]
    return filtered

599

600

def diff(self, m2, match=None, clean=False):
    """Finds changes between the current manifest and m2.

    Args:
      m2: the manifest to which this manifest should be compared.
      match: optional matcher; when truthy, both manifests are narrowed
        with _matches(match) before being compared.
      clean: if true, include files unchanged between these manifests
        with a None value in the returned dictionary.

    The result is returned as a dict with filename as key and
    values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
    nodeid in the current/other manifest and fl1/fl2 is the flag
    in the current/other manifest. Where the file does not exist,
    the nodeid will be None and the flags will be the empty
    string.
    """
    if not match:
        return self._lm.diff(m2._lm, clean)
    narrowed_self = self._matches(match)
    narrowed_other = m2._matches(match)
    return narrowed_self.diff(narrowed_other, clean=clean)

620

621

def setflag(self, key, flag):
    """Store ``flag`` for ``key`` while keeping the node already recorded.

    Raises TypeError when ``flag`` is not one of ``_manifestflags``.
    """
    if flag not in _manifestflags:
        raise TypeError(b"Invalid manifest flag set.")
    node = self[key]
    self._lm[key] = (node, flag)

625

626

def get(self, key, default=None):
    """Return the first field stored for ``key``, or ``default`` if the
    key is absent from the underlying manifest."""
    try:
        entry = self._lm[key]
    except KeyError:
        return default
    return entry[0]

631

632

def flags(self, key):
    """Return the second field stored for ``key`` (its flags), or an
    empty byte string if the key is absent."""
    try:
        entry = self._lm[key]
    except KeyError:
        return b''
    return entry[1]

637

638

def copy(self):
    """Return a new manifestdict with the same node length whose
    underlying manifest is a copy of this one's."""
    duplicate = manifestdict(self._nodelen)
    duplicate._lm = self._lm.copy()
    return duplicate

642

643

def items(self):
    """Return a generator over the first two fields of every entry
    produced by the underlying manifest's iterentries()."""
    return (entry[:2] for entry in self._lm.iterentries())

645

646

def iteritems(self):
    """Return a generator over the first two fields of every entry
    produced by the underlying manifest's iterentries()."""
    return (entry[:2] for entry in self._lm.iterentries())

648

649

def iterentries(self):
    """Return whatever the underlying manifest's iterentries() returns."""
    lazy = self._lm
    return lazy.iterentries()

651

652

def text(self):
    """Return the text of the underlying manifest."""
    # most likely uses native version
    lazy = self._lm
    return lazy.text()

655

656

def fastdelta(self, base, changes):
    """Given a base manifest text as a bytearray and a list of changes
    relative to that text, compute a delta that can be used by revlog.

    ``changes`` is iterated as ``(filename, todelete)`` pairs. Returns
    ``(arraytext, deltatext)``: the new full text and the delta against
    ``base``.

    Raises AssertionError when a file marked for deletion has no line in
    ``base``.
    """
    # zero copy representation of base as a buffer
    addbuf = util.buffer(base)

    changes = list(changes)
    if len(changes) >= FASTDELTA_TEXTDIFF_THRESHOLD:
        # For large changes, it's much cheaper to just build the text and
        # diff it.
        arraytext = bytearray(self.text())
        deltatext = mdiff.textdiff(
            util.buffer(base), util.buffer(arraytext)
        )
        return arraytext, deltatext

    delta = []
    span_start = None
    span_end = None
    span_lines = [b""]
    pos = 0
    # start with a readonly loop that finds the offset of
    # each line and creates the deltas
    for f, todelete in changes:
        # pos is either the offset of f's line or its sorted insert point
        pos, end = _msearch(addbuf, f, pos)
        if todelete:
            if pos == end:
                # item we want to delete was not found, error out
                raise AssertionError(
                    _(b"failed to remove %s from manifest") % f
                )
            line = b""
        else:
            h, fl = self._lm[f]
            line = b"%s\0%s%s\n" % (f, hex(h), fl)

        if span_start is not None and span_start <= pos <= span_end:
            # touches the span being built: grow it instead of starting
            # a new hunk
            span_end = max(span_end, end)
            if line:
                span_lines.append(line)
        else:
            if span_start is not None:
                delta.append([span_start, span_end, b"".join(span_lines)])
            span_start, span_end, span_lines = pos, end, [line]

    if span_start is not None:
        delta.append([span_start, span_end, b"".join(span_lines)])
    # apply the delta to the base, and get a delta for addrevision
    deltatext, arraytext = _addlistdelta(base, delta)
    return arraytext, deltatext

710

711

712

def _msearch(m, s, lo=0, hi=None):

712

def _msearch(m, s, lo=0, hi=None):

713

"""return a tuple (start, end) that says where to find s within m.

713

"""return a tuple (start, end) that says where to find s within m.

714

715

If the string is found m[start:end] are the line containing

715

If the string is found m[start:end] are the line containing

716

that string. If start == end the string was not found and

716

that string. If start == end the string was not found and

717

they indicate the proper sorted insertion point.

717

they indicate the proper sorted insertion point.

718

719

m should be a buffer, a memoryview or a byte string.

719

m should be a buffer, a memoryview or a byte string.

720

s is a byte string"""

720

s is a byte string"""

721

722

def advance(i, c):

722

def advance(i, c):

723

while i < lenm and m[i : i + 1] != c:

723

while i < lenm and m[i : i + 1] != c:

724

i += 1

724

i += 1

725

return i

725

return i

726

727

if not s:

727

if not s:

728

return (lo, lo)

728

return (lo, lo)

729

lenm = len(m)

729

lenm = len(m)

730

if not hi:

730

if not hi:

731

hi = lenm

731

hi = lenm

732

while lo < hi:

732

while lo < hi:

733

mid = (lo + hi) // 2

733

mid = (lo + hi) // 2

734

start = mid

734

start = mid

735

while start > 0 and m[start - 1 : start] != b'\n':

735

while start > 0 and m[start - 1 : start] != b'\n':

736

start -= 1

736

start -= 1

737

end = advance(start, b'\0')

737

end = advance(start, b'\0')

738

if bytes(m[start:end]) < s:

738

if bytes(m[start:end]) < s:

739

# we know that after the null there are 40 bytes of sha1

739

# we know that after the null there are 40 bytes of sha1

740

# this translates to the bisect lo = mid + 1

740

# this translates to the bisect lo = mid + 1

741

lo = advance(end + 40, b'\n') + 1

741

lo = advance(end + 40, b'\n') + 1

742

else:

742

else:

743

# this translates to the bisect hi = mid

743

# this translates to the bisect hi = mid

744

hi = start

744

hi = start

745

end = advance(lo, b'\0')

745

end = advance(lo, b'\0')

746

found = m[lo:end]

746

found = m[lo:end]

747

if s == found:

747

if s == found:

748

# we know that after the null there are 40 bytes of sha1

748

# we know that after the null there are 40 bytes of sha1

749

end = advance(end + 40, b'\n')

749

end = advance(end + 40, b'\n')

750

return (lo, end + 1)

750

return (lo, end + 1)

751

else:

751

else:

752

return (lo, lo)

752

return (lo, lo)

753

754

755

def _checkforbidden(l):

755

def _checkforbidden(l):

756

"""Check filenames for illegal characters."""

756

"""Check filenames for illegal characters."""

757

for f in l:

757

for f in l:

758

if b'\n' in f or b'\r' in f:

758

if b'\n' in f or b'\r' in f:

759

raise error.StorageError(

759

raise error.StorageError(

760

_(b"'\\n' and '\\r' disallowed in filenames: %r")

760

_(b"'\\n' and '\\r' disallowed in filenames: %r")

761

% pycompat.bytestr(f)

761

% pycompat.bytestr(f)

762

)

762

)

763

764

765

# apply the changes collected during the bisect loop to our addlist

765

# apply the changes collected during the bisect loop to our addlist

766

# return a delta suitable for addrevision

766

# return a delta suitable for addrevision

767

def _addlistdelta(addlist, x):

767

def _addlistdelta(addlist, x):

768

# for large addlist arrays, building a new array is cheaper

768

# for large addlist arrays, building a new array is cheaper

769

# than repeatedly modifying the existing one

769

# than repeatedly modifying the existing one

770

currentposition = 0

770

currentposition = 0

771

newaddlist = bytearray()

771

newaddlist = bytearray()

772

773

for start, end, content in x:

773

for start, end, content in x:

774

newaddlist += addlist[currentposition:start]

774

newaddlist += addlist[currentposition:start]

775

if content:

775

if content:

776

newaddlist += bytearray(content)

776

newaddlist += bytearray(content)

777

778

currentposition = end

778

currentposition = end

779

780

newaddlist += addlist[currentposition:]

780

newaddlist += addlist[currentposition:]

781

782

deltatext = b"".join(

782

deltatext = b"".join(

783

struct.pack(b">lll", start, end, len(content)) + content

783

struct.pack(b">lll", start, end, len(content)) + content

784

for start, end, content in x

784

for start, end, content in x

785

)

785

)

786

return deltatext, newaddlist

786

return deltatext, newaddlist

787

788

789

def _splittopdir(f):

789

def _splittopdir(f):

790

if b'/' in f:

790

if b'/' in f:

791

dir, subpath = f.split(b'/', 1)

791

dir, subpath = f.split(b'/', 1)

792

return dir + b'/', subpath

792

return dir + b'/', subpath

793

else:

793

else:

794

return b'', f

794

return b'', f

795

796

797

_noop = lambda s: None

797

_noop = lambda s: None

798

799

800

@interfaceutil.implementer(repository.imanifestdict)

800

@interfaceutil.implementer(repository.imanifestdict)

801

class treemanifest:

801

class treemanifest:

802

def __init__(self, nodeconstants, dir=b'', text=b''):
    """Create an empty tree manifest for directory ``dir``.

    When ``text`` is non-empty it is parsed as a flat manifest and the
    instance is marked dirty; a sub-tree reference in that text makes the
    reader callback raise AssertionError.
    """
    self.nodeconstants = nodeconstants
    self._dir = dir
    self._node = nodeconstants.nullid
    self._nodelen = nodeconstants.nodelen
    # _noop means "nothing pending" for both callbacks
    self._loadfunc = _noop
    self._copyfunc = _noop
    self._dirty = False
    self._dirs = {}
    self._lazydirs = {}
    # Using _lazymanifest here is a little slower than plain old dicts
    self._files = {}
    self._flags = {}
    if not text:
        return

    def readsubtree(subdir, subm):
        raise AssertionError(
            b'treemanifest constructor only accepts flat manifests'
        )

    self.parse(text, readsubtree)
    self._dirty = True  # Mark flat manifest dirty after parsing

824

825

def _subpath(self, path):

825

def _subpath(self, path):

826

return self._dir + path

826

return self._dir + path

827

828

def _loadalllazy(self):

828

def _loadalllazy(self):

829

selfdirs = self._dirs

829

selfdirs = self._dirs

830

subpath = self._subpath

830

subpath = self._subpath

831

for d, (node, readsubtree, docopy) in self._lazydirs.items():

831

for d, (node, readsubtree, docopy) in self._lazydirs.items():

832

if docopy:

832

if docopy:

833

selfdirs[d] = readsubtree(subpath(d), node).copy()

833

selfdirs[d] = readsubtree(subpath(d), node).copy()

834

else:

834

else:

835

selfdirs[d] = readsubtree(subpath(d), node)

835

selfdirs[d] = readsubtree(subpath(d), node)

836

self._lazydirs = {}

836

self._lazydirs = {}

837

838

def _loadlazy(self, d):

838

def _loadlazy(self, d):

839

v = self._lazydirs.get(d)

839

v = self._lazydirs.get(d)

840

if v:

840

if v:

841

node, readsubtree, docopy = v

841

node, readsubtree, docopy = v

842

if docopy:

842

if docopy:

843

self._dirs[d] = readsubtree(self._subpath(d), node).copy()

843

self._dirs[d] = readsubtree(self._subpath(d), node).copy()

844

else:

844

else:

845

self._dirs[d] = readsubtree(self._subpath(d), node)

845

self._dirs[d] = readsubtree(self._subpath(d), node)

846

del self._lazydirs[d]

846

del self._lazydirs[d]

847

848

def _loadchildrensetlazy(self, visit):

848

def _loadchildrensetlazy(self, visit):

849

if not visit:

849

if not visit:

850

return None

850

return None

851

if visit == b'all' or visit == b'this':

851

if visit == b'all' or visit == b'this':

852

self._loadalllazy()

852

self._loadalllazy()

853

return None

853

return None

854

855

loadlazy = self._loadlazy

855

loadlazy = self._loadlazy

856

for k in visit:

856

for k in visit:

857

loadlazy(k + b'/')

857

loadlazy(k + b'/')

858

return visit

858

return visit

859

860

def _loaddifflazy(self, t1, t2):

860

def _loaddifflazy(self, t1, t2):

861

"""load items in t1 and t2 if they're needed for diffing.

861

"""load items in t1 and t2 if they're needed for diffing.

862

863

The criteria currently is:

863

The criteria currently is:

864

- if it's not present in _lazydirs in either t1 or t2, load it in the

864

- if it's not present in _lazydirs in either t1 or t2, load it in the

865

other (it may already be loaded or it may not exist, doesn't matter)

865

other (it may already be loaded or it may not exist, doesn't matter)

866

- if it's present in _lazydirs in both, compare the nodeid; if it

866

- if it's present in _lazydirs in both, compare the nodeid; if it

867

differs, load it in both

867

differs, load it in both

868

"""

868

"""

869

toloadlazy = []

869

toloadlazy = []

870

for d, v1 in t1._lazydirs.items():

870

for d, v1 in t1._lazydirs.items():

871

v2 = t2._lazydirs.get(d)

871

v2 = t2._lazydirs.get(d)

872

if not v2 or v2[0] != v1[0]:

872

if not v2 or v2[0] != v1[0]:

873

toloadlazy.append(d)

873

toloadlazy.append(d)

874

for d, v1 in t2._lazydirs.items():

874

for d, v1 in t2._lazydirs.items():

875

if d not in t1._lazydirs:

875

if d not in t1._lazydirs:

876

toloadlazy.append(d)

876

toloadlazy.append(d)

877

878

for d in toloadlazy:

878

for d in toloadlazy:

879

t1._loadlazy(d)

879

t1._loadlazy(d)

880

t2._loadlazy(d)

880

t2._loadlazy(d)

881

882

def __len__(self):
    """Return the number of files in this tree, counting every
    sub-directory recursively (all lazy sub-directories get loaded)."""
    self._load()
    own = len(self._files)
    self._loadalllazy()
    return own + sum(sub.__len__() for sub in self._dirs.values())

889

890

def __nonzero__(self):
    """Return True when this tree is not empty."""
    # Faster than "__len__() != 0" since it avoids loading sub-manifests
    empty = self._isempty()
    return not empty

__bool__ = __nonzero__

895

896

def _isempty(self):
    """Return True when neither this tree nor any of its sub-directories
    holds a file."""
    self._load()  # for consistency; already loaded by all callers
    # See if we can skip loading everything.
    if self._files:
        return False
    if self._dirs and any(not sub._isempty() for sub in self._dirs.values()):
        return False
    # nothing found in what is already loaded: check the lazy ones too
    self._loadalllazy()
    if not self._dirs:
        return True
    return all(sub._isempty() for sub in self._dirs.values())

905

906

@encoding.strmethod
def __repr__(self):
    """Describe the tree: directory, hex node, whether a load is still
    pending, dirty state and object id."""
    template = b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
    # "loaded" means no load callback is pending any more
    loaded = bool(self._loadfunc is _noop)
    return template % (
        self._dir,
        hex(self._node),
        loaded,
        self._dirty,
        id(self),
    )

918

919

def dir(self):
    """Return the directory this tree manifest represents.

    The value includes a trailing '/'; the repo root directory is the
    empty string."""
    path = self._dir
    return path

923

924

def node(self):
    """Return the node of this instance (nullid for unsaved instances).

    The node should be updated when the instance is read or written from
    a revlog. Asking for it while the instance is dirty trips an
    assertion.
    """
    assert not self._dirty
    current = self._node
    return current

930

931

def setnode(self, node):
    """Record ``node`` as this instance's node and clear the dirty flag."""
    self._dirty = False
    self._node = node

934

935

def iterentries(self):
    """Yield ``(path, node, flags)`` for every file in this tree,
    descending into sub-directories, in sorted order of the names at each
    level."""
    self._load()
    self._loadalllazy()
    merged = sorted(itertools.chain(self._dirs.items(), self._files.items()))
    for name, value in merged:
        if name not in self._files:
            # a sub-directory: value is the sub-tree
            yield from value.iterentries()
            continue
        yield self._subpath(name), value, self._flags.get(name, b'')

946

947

def items(self):
    """Yield ``(path, node)`` for every file in this tree, descending
    into sub-directories, in sorted order of the names at each level."""
    self._load()
    self._loadalllazy()
    merged = sorted(itertools.chain(self._dirs.items(), self._files.items()))
    for name, value in merged:
        if name not in self._files:
            # a sub-directory: value is the sub-tree
            for path, subnode in value.items():
                yield path, subnode
            continue
        yield self._subpath(name), value

iteritems = items

960

961

def iterkeys(self):
    """Yield the path of every file in this tree, descending into
    sub-directories, in sorted order of the names at each level."""
    self._load()
    self._loadalllazy()
    for name in sorted(itertools.chain(self._dirs, self._files)):
        if name not in self._files:
            # a sub-directory: iterate the sub-tree's own paths
            yield from self._dirs[name]
            continue
        yield self._subpath(name)

970

971

def keys(self):
    """Return a list of everything iterkeys() yields."""
    return [*self.iterkeys()]

973

974

def __iter__(self):
    """Iterate over the file paths of this tree (same as iterkeys())."""
    paths = self.iterkeys()
    return paths

976

977

def __contains__(self, f):
    """Return True when file ``f`` is in this tree; ``None`` is never
    contained."""
    if f is None:
        return False
    self._load()
    topdir, subpath = _splittopdir(f)
    if not topdir:
        return f in self._files

    self._loadlazy(topdir)
    subtree = self._dirs.get(topdir)
    if subtree is None:
        return False
    return subtree.__contains__(subpath)

991

992

def get(self, f, default=None):
    """Return the node stored for file ``f``, or ``default`` when the
    file (or its top-level directory) is not in this tree."""
    self._load()
    topdir, subpath = _splittopdir(f)
    if not topdir:
        return self._files.get(f, default)

    self._loadlazy(topdir)
    subtree = self._dirs.get(topdir)
    if subtree is None:
        return default
    return subtree.get(subpath, default)

1003

1004

def __getitem__(self, f):
    """Return the node stored for file ``f``; a missing file or missing
    top-level directory surfaces as the KeyError of the dict lookup."""
    self._load()
    topdir, subpath = _splittopdir(f)
    if not topdir:
        return self._files[f]

    self._loadlazy(topdir)
    return self._dirs[topdir].__getitem__(subpath)

1013

1014

def flags(self, f):
    """Return the flags stored for file ``f``.

    The result is an empty byte string when the file is unknown, when
    its top-level directory is missing, or when ``f`` is itself a key of
    the (lazy) sub-directory tables.
    """
    self._load()
    topdir, subpath = _splittopdir(f)
    if topdir:
        self._loadlazy(topdir)
        subtree = self._dirs.get(topdir)
        if subtree is None:
            return b''
        return subtree.flags(subpath)

    if f in self._lazydirs or f in self._dirs:
        return b''
    return self._flags.get(f, b'')

1027

1028

def find(self, f):
    """Return ``(node, flags)`` for file ``f``; flags default to an empty
    byte string. A missing file or top-level directory surfaces as the
    KeyError of the dict lookup."""
    self._load()
    topdir, subpath = _splittopdir(f)
    if not topdir:
        return self._files[f], self._flags.get(f, b'')

    self._loadlazy(topdir)
    return self._dirs[topdir].find(subpath)

1037

1038

def __delitem__(self, f):
    """Remove file ``f`` (and its flags) from this tree and mark the tree
    dirty; a sub-directory left empty by the removal is dropped."""
    self._load()
    topdir, subpath = _splittopdir(f)
    if topdir:
        self._loadlazy(topdir)

        subtree = self._dirs[topdir]
        subtree.__delitem__(subpath)
        # If the directory is now empty, remove it
        if subtree._isempty():
            del self._dirs[topdir]
    else:
        del self._files[f]
        self._flags.pop(f, None)
    self._dirty = True

1053

1054

def set(self, f, node, flags):
    """Set both the node and the flags for path f.

    Missing intermediate sub-trees are created. Raises TypeError when
    ``flags`` is not one of ``_manifestflags``. Marks the tree dirty.
    """
    assert node is not None
    if flags not in _manifestflags:
        raise TypeError(b"Invalid manifest flag set.")
    self._load()
    topdir, subpath = _splittopdir(f)
    if topdir:
        self._loadlazy(topdir)
        subtree = self._dirs.get(topdir)
        if subtree is None:
            subtree = treemanifest(self.nodeconstants, self._subpath(topdir))
            self._dirs[topdir] = subtree
        subtree.set(subpath, node, flags)
    else:
        assert len(node) in (20, 32)
        self._files[f] = node
        self._flags[f] = flags
    self._dirty = True

1073

1074

def __setitem__(self, f, n):
    """Store node ``n`` for path ``f``, creating missing intermediate
    sub-trees, and mark the tree dirty."""
    assert n is not None
    self._load()
    topdir, subpath = _splittopdir(f)
    if topdir:
        self._loadlazy(topdir)
        subtree = self._dirs.get(topdir)
        if subtree is None:
            subtree = treemanifest(self.nodeconstants, self._subpath(topdir))
            self._dirs[topdir] = subtree
        subtree.__setitem__(subpath, n)
    else:
        # manifest nodes are either 20 bytes or 32 bytes,
        # depending on the hash in use. Assert this as historically
        # sometimes extra bytes were added.
        assert len(n) in (20, 32)
        self._files[f] = n
    self._dirty = True

1092

1093

def _load(self):
    """Run the pending load callback, or failing that the pending copy
    callback, at most once each.

    The callback slot is reset to ``_noop`` before the callback is
    invoked. At most one of the two callbacks runs per call.
    """
    pending_load = self._loadfunc
    if pending_load is not _noop:
        self._loadfunc = _noop
        pending_load(self)
        return

    pending_copy = self._copyfunc
    if pending_copy is not _noop:
        self._copyfunc = _noop
        pending_copy(self)

1100

1101

def setflag(self, f, flags):
    """Set the flags (symlink, executable) for path f.

    Missing intermediate sub-trees are created. Raises TypeError when
    ``flags`` is not one of ``_manifestflags``. Marks the tree dirty.
    """
    if flags not in _manifestflags:
        raise TypeError(b"Invalid manifest flag set.")
    self._load()
    topdir, subpath = _splittopdir(f)
    if topdir:
        self._loadlazy(topdir)
        subtree = self._dirs.get(topdir)
        if subtree is None:
            subtree = treemanifest(self.nodeconstants, self._subpath(topdir))
            self._dirs[topdir] = subtree
        subtree.setflag(subpath, flags)
    else:
        self._flags[f] = flags
    self._dirty = True

1117

1118

def copy(self):
    """Return a copy of this tree.

    If this tree itself has a copy pending, the new tree inherits that
    callback. Otherwise the content is copied right away when this tree
    has no load pending, or deferred to the new tree's first _load()
    when it has.
    """
    copy = treemanifest(self.nodeconstants, self._dir)
    copy._node = self._node
    copy._dirty = self._dirty

    if self._copyfunc is not _noop:
        copy._copyfunc = self._copyfunc
        return copy

    def _copyfunc(s):
        self._load()
        # lazy entries are re-flagged so they get copied when loaded
        s._lazydirs = {
            d: (n, r, True) for d, (n, r, c) in self._lazydirs.items()
        }
        s._dirs.update((d, v.copy()) for d, v in self._dirs.items())
        s._files = dict.copy(self._files)
        s._flags = dict.copy(self._flags)

    if self._loadfunc is _noop:
        _copyfunc(copy)
    else:
        copy._copyfunc = _copyfunc
    return copy

1142

1143

def filesnotin(self, m2, match=None):
    '''Set of files in this manifest that are not in the other

    With a matcher that is not always(), both manifests are narrowed with
    _matches(match) first.'''
    if match and not match.always():
        narrowed_self = self._matches(match)
        narrowed_other = m2._matches(match)
        return narrowed_self.filesnotin(narrowed_other)

    files = set()

    def _filesnotin(t1, t2):
        # same node and both clean: skip this pair entirely
        if t1._node == t2._node and not (t1._dirty or t2._dirty):
            return
        t1._load()
        t2._load()
        self._loaddifflazy(t1, t2)
        for d, sub1 in t1._dirs.items():
            if d in t2._dirs:
                _filesnotin(sub1, t2._dirs[d])
            else:
                # whole directory is missing on the other side
                files.update(sub1.iterkeys())

        for fn in t1._files:
            if fn not in t2._files:
                files.add(t1._subpath(fn))

    _filesnotin(self, m2)
    return files

1171

1172

@propertycache
def _alldirs(self):
    """Cached ``pathutil.dirs`` object built from this manifest."""
    return pathutil.dirs(self)

1175

1176

def dirs(self):
    """Return the cached ``_alldirs`` value for this manifest."""
    return self._alldirs

1178

1179

def hasdir(self, dir):
    """Return True if ``dir`` names a directory of this manifest.

    ``dir`` is split with ``_splittopdir``.  When it has a top-level
    component, that component is loaded lazily and the question is
    delegated to the matching sub manifest (False when there is none).
    Otherwise ``dir + b'/'`` is looked up among the loaded and the lazy
    sub directories of this manifest.
    """
    self._load()
    topdir, subdir = _splittopdir(dir)
    if topdir:
        self._loadlazy(topdir)
        if topdir in self._dirs:
            return self._dirs[topdir].hasdir(subdir)
        return False
    dirslash = dir + b'/'
    return dirslash in self._dirs or dirslash in self._lazydirs

1189

1190

def walk(self, match):
    """Generates matching file names.

    It also reports nonexistent files by marking them bad with match.bad().
    """
    if match.always():
        yield from self
        return

    fset = set(match.files())

    for fn in self._walk(match):
        # specified pattern is the exact name: it has been found, so it
        # must not be reported as bad below
        fset.discard(fn)
        yield fn

    # for dirstate.walk, files=[''] means "walk the whole tree".
    # follow that here, too
    fset.discard(b'')

    # Whatever is left was requested explicitly but never produced by the
    # walk; it is only acceptable if it names a directory.
    for fn in sorted(fset):
        if not self.hasdir(fn):
            match.bad(fn, None)

1215

1216

def _walk(self, match):

1216

def _walk(self, match):

1217

'''Recursively generates matching file names for walk().'''

1217

'''Recursively generates matching file names for walk().'''

1218

visit = match.visitchildrenset(self._dir[:-1])

1218

visit = match.visitchildrenset(self._dir[:-1])

1219

if not visit:

1219

if not visit:

1220

return

1220

return

1221

1222

# yield this dir's files and walk its submanifests

1222

# yield this dir's files and walk its submanifests

1223

self._load()

1223

self._load()

1224

visit = self._loadchildrensetlazy(visit)

1224

visit = self._loadchildrensetlazy(visit)

1225

for p in sorted(list(self._dirs) + list(self._files)):

1225

for p in sorted(list(self._dirs) + list(self._files)):

1226

if p in self._files:

1226

if p in self._files:

1227

fullp = self._subpath(p)

1227

fullp = self._subpath(p)

1228

if match(fullp):

1228

if match(fullp):

1229

yield fullp

1229

yield fullp

1230

else:

1230

else:

1231

if not visit or p[:-1] in visit:

1231

if not visit or p[:-1] in visit:

1232

for f in self._dirs[p]._walk(match):

1232

for f in self._dirs[p]._walk(match):

1233

yield f

1233

yield f

1234

1235

def _matches(self, match):

1235

def _matches(self, match):

1236

"""recursively generate a new manifest filtered by the match argument."""

1236

"""recursively generate a new manifest filtered by the match argument."""

1237

if match.always():

1237

if match.always():

1238

return self.copy()

1238

return self.copy()

1239

return self._matches_inner(match)

1239

return self._matches_inner(match)

1240

1241

def _matches_inner(self, match):

1241

def _matches_inner(self, match):

1242

if match.always():

1242

if match.always():

1243

return self.copy()

1243

return self.copy()

1244

1245

visit = match.visitchildrenset(self._dir[:-1])

1245

visit = match.visitchildrenset(self._dir[:-1])

1246

if visit == b'all':

1246

if visit == b'all':

1247

return self.copy()

1247

return self.copy()

1248

ret = treemanifest(self.nodeconstants, self._dir)

1248

ret = treemanifest(self.nodeconstants, self._dir)

1249

if not visit:

1249

if not visit:

1250

return ret

1250

return ret

1251

1252

self._load()

1252

self._load()

1253

for fn in self._files:

1253

for fn in self._files:

1254

# While visitchildrenset *usually* lists only subdirs, this is

1254

# While visitchildrenset *usually* lists only subdirs, this is

1255

# actually up to the matcher and may have some files in the set().

1255

# actually up to the matcher and may have some files in the set().

1256

# If visit == 'this', we should obviously look at the files in this

1256

# If visit == 'this', we should obviously look at the files in this

1257

# directory; if visit is a set, and fn is in it, we should inspect

1257

# directory; if visit is a set, and fn is in it, we should inspect

1258

# fn (but no need to inspect things not in the set).

1258

# fn (but no need to inspect things not in the set).

1259

if visit != b'this' and fn not in visit:

1259

if visit != b'this' and fn not in visit:

1260

continue

1260

continue

1261

fullp = self._subpath(fn)

1261

fullp = self._subpath(fn)

1262

# visitchildrenset isn't perfect, we still need to call the regular

1262

# visitchildrenset isn't perfect, we still need to call the regular

1263

# matcher code to further filter results.

1263

# matcher code to further filter results.

1264

if not match(fullp):

1264

if not match(fullp):

1265

continue

1265

continue

1266

ret._files[fn] = self._files[fn]

1266

ret._files[fn] = self._files[fn]

1267

if fn in self._flags:

1267

if fn in self._flags:

1268

ret._flags[fn] = self._flags[fn]

1268

ret._flags[fn] = self._flags[fn]

1269

1270

visit = self._loadchildrensetlazy(visit)

1270

visit = self._loadchildrensetlazy(visit)

1271

for dir, subm in self._dirs.items():

1271

for dir, subm in self._dirs.items():

1272

if visit and dir[:-1] not in visit:

1272

if visit and dir[:-1] not in visit:

1273

continue

1273

continue

1274

m = subm._matches_inner(match)

1274

m = subm._matches_inner(match)

1275

if not m._isempty():

1275

if not m._isempty():

1276

ret._dirs[dir] = m

1276

ret._dirs[dir] = m

1277

1278

if not ret._isempty():

1278

if not ret._isempty():

1279

ret._dirty = True

1279

ret._dirty = True

1280

return ret

1280

return ret

1281

1282

def fastdelta(self, base, changes):
    """Always raise ``FastdeltaUnavailable``.

    ``base`` and ``changes`` are accepted but not used by this
    implementation.
    """
    raise FastdeltaUnavailable()

1284

1285

def diff(self, m2, match=None, clean=False):
    """Finds changes between the current manifest and m2.

    Args:
      m2: the manifest to which this manifest should be compared.
      match: optional matcher; when given and not an "always" matcher,
             both manifests are filtered with it before being compared.
      clean: if true, include files unchanged between these manifests
             with a None value in the returned dictionary.

    The result is returned as a dict with filename as key and
    values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
    nodeid in the current/other manifest and fl1/fl2 is the flag
    in the current/other manifest. Where the file does not exist,
    the nodeid will be None and the flags will be the empty
    string.
    """
    if match and not match.always():
        m1 = self._matches(match)
        m2 = m2._matches(match)
        return m1.diff(m2, clean=clean)
    result = {}
    # Stand-in for a directory that exists on one side only.
    emptytree = treemanifest(self.nodeconstants)

    def _iterativediff(t1, t2, stack):
        """compares two tree manifests and append new tree-manifests which
        needs to be compared to stack"""
        if t1._node == t2._node and not t1._dirty and not t2._dirty:
            return
        t1._load()
        t2._load()
        self._loaddifflazy(t1, t2)

        for d, m1 in t1._dirs.items():
            m2 = t2._dirs.get(d, emptytree)
            stack.append((m1, m2))

        for d, m2 in t2._dirs.items():
            if d not in t1._dirs:
                stack.append((emptytree, m2))

        for fn, n1 in t1._files.items():
            fl1 = t1._flags.get(fn, b'')
            n2 = t2._files.get(fn, None)
            fl2 = t2._flags.get(fn, b'')
            if n1 != n2 or fl1 != fl2:
                result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
            elif clean:
                result[t1._subpath(fn)] = None

        for fn, n2 in t2._files.items():
            if fn not in t1._files:
                fl2 = t2._flags.get(fn, b'')
                result[t2._subpath(fn)] = ((None, b''), (n2, fl2))

    # Explicit work stack instead of recursion over the directory tree.
    stackls = []
    _iterativediff(self, m2, stackls)
    while stackls:
        t1, t2 = stackls.pop()
        # stackls is populated in the function call
        _iterativediff(t1, t2, stackls)
    return result

1345

1346

def unmodifiedsince(self, m2):
    """Return True if both manifests are clean and share the same node."""
    return not self._dirty and not m2._dirty and self._node == m2._node

1348

1349

def parse(self, text, readsubtree):
    """Fill this manifest from the serialized manifest ``text``.

    Entries flagged ``b't'`` are recorded as lazy sub directories that
    will use ``readsubtree``; entries whose name contains a slash are
    stored through ``__setitem__``/``setflag``; all other entries are
    written straight into ``_files``/``_flags``.
    """
    selflazy = self._lazydirs
    for f, n, fl in _parse(self._nodelen, text):
        if fl == b't':
            f = f + b'/'
            # False below means "doesn't need to be copied" and can use the
            # cached value from readsubtree directly.
            selflazy[f] = (n, readsubtree, False)
        elif b'/' in f:
            # This is a flat manifest, so use __setitem__ and setflag rather
            # than assigning directly to _files and _flags, so we can
            # assign a path in a subdirectory, and to mark dirty (compared
            # to nullid).
            self[f] = n
            if fl:
                self.setflag(f, fl)
        else:
            # Assigning to _files and _flags avoids marking as dirty,
            # and should be a little faster.
            self._files[f] = n
            if fl:
                self._flags[f] = fl

1371

1372

def text(self):
    """Get the full data of this manifest as a bytestring."""
    self._load()
    return _text(self.iterentries())

1376

1377

def dirtext(self):
    """Get the full data of this directory as a bytestring. Make sure that
    any submanifests have been written first, so their nodeids are correct.
    """
    self._load()
    flags = self.flags
    # Directory keys end with a slash, which is stripped for the entry
    # name; directories (loaded or lazy) are emitted with the b't' flag.
    lazydirs = [(d[:-1], v[0], b't') for d, v in self._lazydirs.items()]
    dirs = [(d[:-1], self._dirs[d]._node, b't') for d in self._dirs]
    files = [(f, self._files[f], flags(f)) for f in self._files]
    return _text(sorted(dirs + files + lazydirs))

1387

1388

def read(self, gettext, readsubtree):
    """Install a deferred loader for this manifest.

    Nothing is read here: ``gettext()`` is only called, and its result
    parsed with ``readsubtree``, when the stored ``_loadfunc`` is
    eventually invoked.  The loaded manifest is then marked clean.
    """

    def _load_for_read(s):
        s.parse(gettext(), readsubtree)
        # parse() may mark the manifest dirty; freshly read data is clean.
        s._dirty = False

    self._loadfunc = _load_for_read

1394

1395

def writesubtrees(self, m1, m2, writesubtree, match):
    """Call ``writesubtree`` for every sub manifest selected by ``match``.

    For each visited sub directory ``writesubtree(subm, subp1, subp2,
    match)`` is called, where ``subp1``/``subp2`` are the nodes of that
    directory in ``m1``/``m2``; the two are swapped when the first one
    is the null id.
    """
    self._load()  # for consistency; should never have any effect here
    m1._load()
    m2._load()
    emptytree = treemanifest(self.nodeconstants)

    def getnode(m, d):
        # Prefer the node recorded for a still-lazy directory, so that the
        # directory does not have to be loaded.
        ld = m._lazydirs.get(d)
        if ld:
            return ld[0]
        return m._dirs.get(d, emptytree)._node

    # let's skip investigating things that `match` says we do not need.
    visit = match.visitchildrenset(self._dir[:-1])
    visit = self._loadchildrensetlazy(visit)
    if visit == b'this' or visit == b'all':
        visit = None
    for d, subm in self._dirs.items():
        if visit and d[:-1] not in visit:
            continue
        subp1 = getnode(m1, d)
        subp2 = getnode(m2, d)
        if subp1 == self.nodeconstants.nullid:
            subp1, subp2 = subp2, subp1
        writesubtree(subm, subp1, subp2, match)

1420

1421

def walksubtrees(self, matcher=None):
    """Returns an iterator of the subtrees of this manifest, including this
    manifest itself.

    If `matcher` is provided, it only returns subtrees that match.
    """
    if matcher and not matcher.visitdir(self._dir[:-1]):
        return
    if not matcher or matcher(self._dir[:-1]):
        yield self

    self._load()
    # OPT: use visitchildrenset to avoid loading everything.
    self._loadalllazy()
    for subm in self._dirs.values():
        yield from subm.walksubtrees(matcher=matcher)

1438

1439

1440

class manifestfulltextcache(util.lrucachedict):
    """File-backed LRU cache for the manifest cache

    File consists of entries, up to EOF:

    - 20 bytes node, 4 bytes length, <length> manifest data

    These are written in reverse cache order (oldest to newest).

    The file is read lazily: every accessor first calls read(), which is
    a no-op once the data has been loaded or while no opener is set.
    """

    _file = b'manifestfulltextcache'

    def __init__(self, max):
        super().__init__(max)
        # True when the in-memory state differs from what is on disk.
        self._dirty = False
        # True once the on-disk cache has been loaded (or found missing).
        self._read = False
        # Callable used to open the cache file; None disables persistence.
        self._opener = None

    def read(self):
        """Load the entries of the cache file, if not done already."""
        if self._read or self._opener is None:
            return

        try:
            with self._opener(self._file) as fp:
                # Bypass our own __setitem__ so that loading does not
                # re-enter read() nor mark the cache dirty.
                store = super().__setitem__
                # ignore trailing data, this is a cache, corruption is skipped
                while True:
                    # TODO do we need to do work here for sha1 portability?
                    node = fp.read(20)
                    if len(node) < 20:
                        break
                    try:
                        size = struct.unpack(b'>L', fp.read(4))[0]
                    except struct.error:
                        break
                    value = bytearray(fp.read(size))
                    if len(value) != size:
                        break
                    store(node, value)
        except IOError:
            # the file is allowed to be missing
            pass

        self._read = True
        self._dirty = False

    def write(self):
        """Write the cache to its file if it is dirty and an opener is set."""
        if not self._dirty or self._opener is None:
            return
        # rotate backwards to the first used node
        try:
            with self._opener(
                self._file, b'w', atomictemp=True, checkambig=True
            ) as fp:
                node = self._head.prev
                while True:
                    if node.key in self._cache:
                        fp.write(node.key)
                        fp.write(struct.pack(b'>L', len(node.value)))
                        fp.write(node.value)
                    if node is self._head:
                        break
                    node = node.prev
        except IOError:
            # We could not write the cache (eg: permission error)
            # the content can be missing.
            #
            # We could try harder and see if we could recreate a wcache
            # directory where we could write to.
            #
            # XXX the error passes silently, having some way to issue an
            # error log `ui.log` would be nice.
            pass

    def __len__(self):
        if not self._read:
            self.read()
        return super().__len__()

    def __contains__(self, k):
        if not self._read:
            self.read()
        return super().__contains__(k)

    def __iter__(self):
        if not self._read:
            self.read()
        return super().__iter__()

    def __getitem__(self, k):
        if not self._read:
            self.read()
        # the cache lru order can change on read
        setdirty = self._cache.get(k) is not self._head
        value = super().__getitem__(k)
        if setdirty:
            self._dirty = True
        return value

    def __setitem__(self, k, v):
        if not self._read:
            self.read()
        super().__setitem__(k, v)
        self._dirty = True

    def __delitem__(self, k):
        if not self._read:
            self.read()
        super().__delitem__(k)
        self._dirty = True

    def get(self, k, default=None):
        if not self._read:
            self.read()
        return super().get(k, default=default)

    def clear(self, clear_persisted_data=False):
        """Empty the in-memory cache.

        With ``clear_persisted_data`` the (now empty) cache is also
        written out, replacing the persisted entries.
        """
        super().clear()
        if clear_persisted_data:
            self._dirty = True
            self.write()
        # Force the next access to go through read() again.
        self._read = False

1563

1564

1565

# An upper bound of what we expect from compression
# (real-life value seems to be "3").
MAXCOMPRESSION = 3

1568

1569

1570

class FastdeltaUnavailable(Exception):
    """Exception raised when fastdelta isn't usable on a manifest."""

1572

1573

1574

@interfaceutil.implementer(repository.imanifeststorage)

1574

@interfaceutil.implementer(repository.imanifeststorage)

1575

class manifestrevlog:

1575

class manifestrevlog:

1576

"""A revlog that stores manifest texts. This is responsible for caching the

1576

"""A revlog that stores manifest texts. This is responsible for caching the

1577

full-text manifest contents.

1577

full-text manifest contents.

1578

"""

1578

"""

1579

1580

def __init__(
    self,
    nodeconstants,
    opener,
    tree=b'',
    dirlogcache=None,
    treemanifest=False,
):
    """Constructs a new manifest revlog

    `tree` - directory this revlog stores; empty for the root manifest.
    A non-empty value requires tree manifests to be enabled and selects
    the ``meta/<tree>00manifest`` radix.

    `dirlogcache` - cache kept on the root manifest log; only stored when
    `tree` is non-empty, the root creates its own ``{b'': self}``.

    `treemanifest` - used to indicate this is a tree manifest revlog. Opener
    options can also be used to make this a tree manifest revlog. The opener
    option takes precedence, so if it is set to True, we ignore whatever
    value is passed in to the constructor.

    NOTE(review): the previous docstring also described an `indexfile`
    argument, which is not a parameter of this constructor.
    """
    self.nodeconstants = nodeconstants
    # During normal operations, we expect to deal with not more than four
    # revs at a time (such as during commit --amend). When rebasing large
    # stacks of commits, the number can go up, hence the config knob below.
    cachesize = 4
    optiontreemanifest = False
    persistentnodemap = False
    opts = getattr(opener, 'options', None)
    if opts is not None:
        cachesize = opts.get(b'manifestcachesize', cachesize)
        optiontreemanifest = opts.get(b'treemanifest', False)
        # Read through the same guarded ``opts`` as the other options
        # instead of dereferencing ``opener.options`` unconditionally.
        persistentnodemap = opts.get(b'persistent-nodemap', False)

    self._treeondisk = optiontreemanifest or treemanifest

    self._fulltextcache = manifestfulltextcache(cachesize)

    if tree:
        assert self._treeondisk, (tree, b'opts is %r' % opts)

    radix = b'00manifest'
    if tree:
        radix = b"meta/" + tree + radix

    self.tree = tree

    # The dirlogcache is kept on the root manifest log
    if tree:
        self._dirlogcache = dirlogcache
    else:
        self._dirlogcache = {b'': self}

    self._revlog = revlog.revlog(
        opener,
        target=(revlog_constants.KIND_MANIFESTLOG, self.tree),
        radix=radix,
        # only root indexfile is cached
        checkambig=not bool(tree),
        mmaplargeindex=True,
        upperboundcomp=MAXCOMPRESSION,
        persistentnodemap=persistentnodemap,
    )

    self.index = self._revlog.index

1640

1641

def get_revlog(self):
    """return an actual revlog instance if any

    This exists because a lot of code leverages the fact that the
    underlying storage is a revlog for optimization, so giving a simple
    way to access the revlog instance helps such code.
    """
    return self._revlog

1649

1650

def _setupmanifestcachehooks(self, repo):

1650

def _setupmanifestcachehooks(self, repo):

1651

"""Persist the manifestfulltextcache on lock release"""

1651

"""Persist the manifestfulltextcache on lock release"""

1652

if not hasattr(repo, '_wlockref'):

1652

if not hasattr(repo, '_wlockref'):

1653

return

1653

return

1654

1655

self._fulltextcache._opener = repo.wcachevfs

1655

self._fulltextcache._opener = repo.wcachevfs

1656

if repo._currentlock(repo._wlockref) is None:

1656

if repo._currentlock(repo._wlockref) is None:

1657

return

1657

return

1658

1659

reporef = weakref.ref(repo)

1659

reporef = weakref.ref(repo)

1660

manifestrevlogref = weakref.ref(self)

1660

manifestrevlogref = weakref.ref(self)

1661

1662

def persistmanifestcache(success):

1662

def persistmanifestcache(success):

1663

# Repo is in an unknown state, do not persist.

1663

# Repo is in an unknown state, do not persist.

1664

if not success:

1664

if not success:

1665

return

1665

return

1666

1667

repo = reporef()

1667

repo = reporef()

1668

self = manifestrevlogref()

1668

self = manifestrevlogref()

1669

if repo is None or self is None:

1669

if repo is None or self is None:

1670

return

1670

return

1671

if repo.manifestlog.getstorage(b'') is not self:

1671

if repo.manifestlog.getstorage(b'') is not self:

1672

# there's a different manifest in play now, abort

1672

# there's a different manifest in play now, abort

1673

return

1673

return

1674

self._fulltextcache.write()

1674

self._fulltextcache.write()

1675

1676

repo._afterlock(persistmanifestcache)

1676

repo._afterlock(persistmanifestcache)

1677

1678

@property
def fulltextcache(self):
    """The fulltext cache object stored in ``_fulltextcache``."""
    cache = self._fulltextcache
    return cache

1681

1682

def clearcaches(self, clear_persisted_data=False):
    """Drop the revlog caches, the fulltext cache and the dirlog cache.

    ``clear_persisted_data`` is handed unchanged to the fulltext cache's
    ``clear()`` method.
    """
    self._revlog.clearcaches()
    fulltext = self._fulltextcache
    fulltext.clear(clear_persisted_data=clear_persisted_data)
    # start again from a directory cache that only knows this revlog
    fresh = {}
    fresh[self.tree] = self
    self._dirlogcache = fresh

1686

1687

def dirlog(self, d):
    """Return the manifest revlog for directory ``d``, creating it if needed.

    Instances are looked up in, and stored into, ``self._dirlogcache``.
    A non-empty ``d`` is only expected when tree manifests are stored on
    disk (enforced with an assertion).
    """
    if d:
        assert self._treeondisk
    already_known = d in self._dirlogcache
    if not already_known:
        # the new revlog is handed the same cache dict this one uses
        self._dirlogcache[d] = manifestrevlog(
            self.nodeconstants,
            self.opener,
            d,
            self._dirlogcache,
            treemanifest=self._treeondisk,
        )
    return self._dirlogcache[d]

1700

1701

def add(
    self,
    m,
    transaction,
    link,
    p1,
    p2,
    added,
    removed,
    readtree=None,
    match=None,
):
    """Store a manifest in the manifest log and return its node.

    input:

      m:           the manifest dict we want to store
      transaction: the open transaction
      link:        passed through to the revlog's ``addrevision``
      p1:          manifest-node of p1
      p2:          manifest-node of p2
      added:       files added/changed compared to parent
      removed:     files removed compared to parent

    tree manifest input:

      readtree:    a function to read a subtree
      match:       a filematcher for the subpart of the tree manifest
    """
    try:
        if p1 not in self.fulltextcache:
            raise FastdeltaUnavailable()
        # With the first parent available in the manifest cache, a delta
        # can be computed right here from what we know about the manifest
        # up-front, which may save the revlog layer some time later.

        _checkforbidden(added)
        # merge both change lists into a single sorted iterator
        additions = [(path, False) for path in sorted(added)]
        removals = [(path, True) for path in sorted(removed)]
        work = heapq.merge(additions, removals)

        arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
        cachedelta = (self._revlog.rev(p1), deltatext)
        text = util.buffer(arraytext)
        newrev = self._revlog.addrevision(
            text, transaction, link, p1, p2, cachedelta
        )
        n = self._revlog.node(newrev)
    except FastdeltaUnavailable:
        # Either the first parent manifest isn't already loaded or the
        # manifest implementation has no fastdelta support. Encode a
        # fulltext of the manifest instead and leave the delta work to
        # the revlog layer.
        if not self._treeondisk:
            text = m.text()
            newrev = self._revlog.addrevision(
                text, transaction, link, p1, p2
            )
            n = self._revlog.node(newrev)
            arraytext = bytearray(text)
        else:
            assert readtree, b"readtree must be set for treemanifest writes"
            assert match, b"match must be specified for treemanifest writes"
            m1 = readtree(self.tree, p1)
            m2 = readtree(self.tree, p2)
            n = self._addtree(
                m, transaction, link, m1, m2, readtree, match=match
            )
            arraytext = None

    if arraytext is not None:
        self.fulltextcache[n] = arraytext

    return n

1776

1777

def _addtree(self, m, transaction, link, m1, m2, readtree, match):

1777

def _addtree(self, m, transaction, link, m1, m2, readtree, match):

1778

# If the manifest is unchanged compared to one parent,

1778

# If the manifest is unchanged compared to one parent,

1779

# don't write a new revision

1779

# don't write a new revision

1780

if self.tree != b'' and (

1780

if self.tree != b'' and (

1781

m.unmodifiedsince(m1) or m.unmodifiedsince(m2)

1781

m.unmodifiedsince(m1) or m.unmodifiedsince(m2)

1782

):

1782

):

1783

return m.node()

1783

return m.node()

1784

1785

def writesubtree(subm, subp1, subp2, match):

1785

def writesubtree(subm, subp1, subp2, match):

1786

sublog = self.dirlog(subm.dir())

1786

sublog = self.dirlog(subm.dir())

1787

sublog.add(

1787

sublog.add(

1788

subm,

1788

subm,

1789

transaction,

1789

transaction,

1790

link,

1790

link,

1791

subp1,

1791

subp1,

1792

subp2,

1792

subp2,

1793

None,

1793

None,

1794

None,

1794

None,

1795

readtree=readtree,

1795

readtree=readtree,

1796

match=match,

1796

match=match,

1797

)

1797

)

1798

1799

m.writesubtrees(m1, m2, writesubtree, match)

1799

m.writesubtrees(m1, m2, writesubtree, match)

1800

text = m.dirtext()

1800

text = m.dirtext()

1801

n = None

1801

n = None

1802

if self.tree != b'':

1802

if self.tree != b'':

1803

# Double-check whether contents are unchanged to one parent

1803

# Double-check whether contents are unchanged to one parent

1804

if text == m1.dirtext():

1804

if text == m1.dirtext():

1805

n = m1.node()

1805

n = m1.node()

1806

elif text == m2.dirtext():

1806

elif text == m2.dirtext():

1807

n = m2.node()

1807

n = m2.node()

1808

1809

if not n:

1809

if not n:

1810

rev = self._revlog.addrevision(

1810

rev = self._revlog.addrevision(

1811

text, transaction, link, m1.node(), m2.node()

1811

text, transaction, link, m1.node(), m2.node()

1812

)

1812

)

1813

n = self._revlog.node(rev)

1813

n = self._revlog.node(rev)

1814

1815

# Save nodeid so parent manifest can calculate its nodeid

1815

# Save nodeid so parent manifest can calculate its nodeid

1816

m.setnode(n)

1816

m.setnode(n)

1817

return n

1817

return n

1818

1819

def __len__(self):

1819

def __len__(self):

1820

return len(self._revlog)

1820

return len(self._revlog)

1821

1822

def __iter__(self):

1822

def __iter__(self):

1823

return self._revlog.__iter__()

1823

return self._revlog.__iter__()

1824

1825

def rev(self, node):
    """Delegate to the underlying revlog's ``rev(node)``."""
    backing = self._revlog
    return backing.rev(node)

1827

1828

def node(self, rev):
    """Delegate to the underlying revlog's ``node(rev)``."""
    backing = self._revlog
    return backing.node(rev)

1830

1831

def lookup(self, value):
    """Delegate to the underlying revlog's ``lookup(value)``."""
    backing = self._revlog
    return backing.lookup(value)

1833

1834

def parentrevs(self, rev):
    """Delegate to the underlying revlog's ``parentrevs(rev)``."""
    backing = self._revlog
    return backing.parentrevs(rev)

1836

1837

def parents(self, node):
    """Delegate to the underlying revlog's ``parents(node)``."""
    backing = self._revlog
    return backing.parents(node)

1839

1840

def linkrev(self, rev):
    """Delegate to the underlying revlog's ``linkrev(rev)``."""
    backing = self._revlog
    return backing.linkrev(rev)

1842

1843

def checksize(self):
    """Delegate to the underlying revlog's ``checksize()``."""
    backing = self._revlog
    return backing.checksize()

1845

1846

def revision(self, node):
    """Delegate to the underlying revlog's ``revision(node)``."""
    backing = self._revlog
    return backing.revision(node)

1848

1849

def rawdata(self, node):
    """Delegate to the underlying revlog's ``rawdata(node)``."""
    backing = self._revlog
    return backing.rawdata(node)

1851

1852

def revdiff(self, rev1, rev2):
    """Delegate to the underlying revlog's ``revdiff(rev1, rev2)``."""
    backing = self._revlog
    return backing.revdiff(rev1, rev2)

1854

1855

def cmp(self, node, text):
    """Delegate to the underlying revlog's ``cmp(node, text)``."""
    backing = self._revlog
    return backing.cmp(node, text)

1857

1858

def deltaparent(self, rev):
    """Delegate to the underlying revlog's ``deltaparent(rev)``."""
    backing = self._revlog
    return backing.deltaparent(rev)

1860

1861

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
    sidedata_helpers=None,
    debug_info=None,
):
    """Delegate to the underlying revlog's ``emitrevisions``.

    ``nodes`` is passed positionally; every other argument is forwarded
    unchanged as a keyword argument of the same name.
    """
    forwarded = {
        'nodesorder': nodesorder,
        'revisiondata': revisiondata,
        'assumehaveparentrevisions': assumehaveparentrevisions,
        'deltamode': deltamode,
        'sidedata_helpers': sidedata_helpers,
        'debug_info': debug_info,
    }
    return self._revlog.emitrevisions(nodes, **forwarded)

1880

1881

def addgroup(
    self,
    deltas,
    linkmapper,
    transaction,
    alwayscache=False,
    addrevisioncb=None,
    duplicaterevisioncb=None,
    debug_info=None,
    delta_base_reuse_policy=None,
):
    """Delegate to the underlying revlog's ``addgroup``.

    ``deltas``, ``linkmapper`` and ``transaction`` are passed positionally;
    the remaining arguments are forwarded unchanged as keyword arguments
    of the same name.
    """
    forwarded = {
        'alwayscache': alwayscache,
        'addrevisioncb': addrevisioncb,
        'duplicaterevisioncb': duplicaterevisioncb,
        'debug_info': debug_info,
        'delta_base_reuse_policy': delta_base_reuse_policy,
    }
    return self._revlog.addgroup(deltas, linkmapper, transaction, **forwarded)

1902

1903

def rawsize(self, rev):
    """Delegate to the underlying revlog's ``rawsize(rev)``."""
    backing = self._revlog
    return backing.rawsize(rev)

1905

1906

def getstrippoint(self, minlink):
    """Delegate to the underlying revlog's ``getstrippoint(minlink)``."""
    backing = self._revlog
    return backing.getstrippoint(minlink)

1908

1909

def strip(self, minlink, transaction):
    """Delegate to the underlying revlog's ``strip(minlink, transaction)``."""
    backing = self._revlog
    return backing.strip(minlink, transaction)

1911

1912

def files(self):
    """Delegate to the underlying revlog's ``files()``."""
    backing = self._revlog
    return backing.files()

1914

1915

def clone(self, tr, destrevlog, **kwargs):
    """Clone the underlying revlog into ``destrevlog``'s underlying revlog.

    ``destrevlog`` has to be a ``manifestrevlog``; anything else raises
    ``error.ProgrammingError``. Extra keyword arguments are forwarded to
    the revlog's ``clone``.
    """
    if isinstance(destrevlog, manifestrevlog):
        return self._revlog.clone(tr, destrevlog._revlog, **kwargs)

    raise error.ProgrammingError(b'expected manifestrevlog to clone()')

1920

1921

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Delegate to the underlying revlog's ``storageinfo``.

    Every flag is forwarded unchanged as a keyword argument of the same
    name.
    """
    flags = {
        'exclusivefiles': exclusivefiles,
        'sharedfiles': sharedfiles,
        'revisionscount': revisionscount,
        'trackedsize': trackedsize,
        'storedsize': storedsize,
    }
    return self._revlog.storageinfo(**flags)

1936

1937

@property
def opener(self):
    """The ``opener`` attribute of the underlying revlog."""
    backing = self._revlog
    return backing.opener

@opener.setter
def opener(self, value):
    # assignments are applied to the underlying revlog
    backing = self._revlog
    backing.opener = value

1944

1945

1946

@interfaceutil.implementer(repository.imanifestlog)
class manifestlog:
    """Collection of the manifest snapshots referenced by the commits of a
    repository.

    Here 'manifest' means the abstract notion of a snapshot of the list of
    files in a given commit. Users of the objects handed out by this class
    need not care how the manifests they get are implemented (i.e. tree or
    flat or lazily loaded, etc)."""

    def __init__(self, opener, repo, rootstore, narrowmatch):
        self.nodeconstants = repo.nodeconstants

        # The opener's options, when it has any, may override the defaults.
        opts = getattr(opener, 'options', None)
        if opts is None:
            usetreemanifest = False
            cachesize = 4
        else:
            usetreemanifest = opts.get(b'treemanifest', False)
            cachesize = opts.get(b'manifestcachesize', 4)

        self._treemanifests = usetreemanifest

        self._rootstore = rootstore
        self._rootstore._setupmanifestcachehooks(repo)
        self._narrowmatch = narrowmatch

        # Per directory cache of manifestctx or treemanifestctx instances
        self._dirmancache = {b'': util.lrucachedict(cachesize)}

        self._cachesize = cachesize

    def __getitem__(self, node):
        """Return the root manifest instance for ``node``.

        Raises LookupError when the node cannot be found.
        """
        return self.get(b'', node)

    def get(self, tree, node, verify=True):
        """Return the manifest instance for ``node`` in directory ``tree``.

        Raises LookupError when the node cannot be found.

        `verify` - when True, an exception is raised for a node that is
                   not in the revlog
        """
        if node in self._dirmancache.get(tree, ()):
            return self._dirmancache[tree][node]

        narrow = self._narrowmatch
        if not narrow.always() and not narrow.visitdir(tree[:-1]):
            return excludeddirmanifestctx(self.nodeconstants, tree, node)

        if not tree:
            if verify:
                # Called for its side effect: LookupError is raised if
                # node doesn't exist.
                self._rootstore.rev(node)

            if self._treemanifests:
                m = treemanifestctx(self, b'', node)
            else:
                m = manifestctx(self, node)
        elif self._rootstore._treeondisk:
            if verify:
                # Called for its side effect: LookupError is raised if
                # node doesn't exist.
                self.getstorage(tree).rev(node)

            m = treemanifestctx(self, tree, node)
        else:
            raise error.Abort(
                _(
                    b"cannot ask for manifest directory '%s' in a flat "
                    b"manifest"
                )
                % tree
            )

        if node == self.nodeconstants.nullid:
            # the null manifest is never cached
            return m

        mancache = self._dirmancache.get(tree)
        if not mancache:
            mancache = util.lrucachedict(self._cachesize)
            self._dirmancache[tree] = mancache
        mancache[node] = m
        return m

    def getstorage(self, tree):
        """Return the root store's ``dirlog`` for ``tree``."""
        rootstore = self._rootstore
        return rootstore.dirlog(tree)

    def clearcaches(self, clear_persisted_data=False):
        """Empty the per-directory cache, then clear the root store's caches."""
        self._dirmancache.clear()
        rootstore = self._rootstore
        rootstore.clearcaches(clear_persisted_data=clear_persisted_data)

    def rev(self, node):
        """Delegate to the root store's ``rev(node)``."""
        rootstore = self._rootstore
        return rootstore.rev(node)

    def update_caches(self, transaction):
        """Delegate to ``update_caches`` of the root store's revlog."""
        rootrevlog = self._rootstore._revlog
        return rootrevlog.update_caches(transaction=transaction)

2043

2044

2045

@interfaceutil.implementer(repository.imanifestrevisionwritable)
class memmanifestctx:
    """An in-memory flat manifest that can be written to the root storage."""

    def __init__(self, manifestlog):
        self._manifestlog = manifestlog
        nodelen = manifestlog.nodeconstants.nodelen
        self._manifestdict = manifestdict(nodelen)

    def _storage(self):
        """Return the root (``b''``) storage of the manifest log."""
        mflog = self._manifestlog
        return mflog.getstorage(b'')

    def copy(self):
        """Return a new memmanifestctx holding a copy of this manifest dict."""
        duplicate = memmanifestctx(self._manifestlog)
        duplicate._manifestdict = self.read().copy()
        return duplicate

    def read(self):
        """Return the manifest dict held by this context."""
        return self._manifestdict

    def write(self, transaction, link, p1, p2, added, removed, match=None):
        """Add the held manifest dict to the root storage.

        All arguments are forwarded to the storage's ``add``, whose result
        is returned.
        """
        store = self._storage()
        return store.add(
            self._manifestdict,
            transaction,
            link,
            p1,
            p2,
            added,
            removed,
            match=match,
        )

2073

2074

2075

@interfaceutil.implementer(repository.imanifestrevisionstored)
class manifestctx:
    """Represents one revision of a manifest: its contents, its parent
    revs, and its linkrev.
    """

    def __init__(self, manifestlog, node):
        self._manifestlog = manifestlog
        # parsed manifest, filled in lazily by read()
        self._data = None

        self._node = node

        # TODO: We eventually want p1, p2, and linkrev exposed on this class,
        # but let's add it later when something needs it and we can load it
        # lazily.
        # self.p1, self.p2 = store.parents(node)
        # rev = store.rev(node)
        # self.linkrev = store.linkrev(rev)

    def _storage(self):
        """Return the root (``b''``) storage of the manifest log."""
        mflog = self._manifestlog
        return mflog.getstorage(b'')

    def node(self):
        """Return the node this context was created for."""
        return self._node

    def copy(self):
        """Return a memmanifestctx holding a copy of this manifest's content."""
        duplicate = memmanifestctx(self._manifestlog)
        duplicate._manifestdict = self.read().copy()
        return duplicate

    @propertycache
    def parents(self):
        """What the storage's ``parents`` returns for this node."""
        store = self._storage()
        return store.parents(self._node)

    def read(self):
        """Return the manifest dict of this revision, loading it on first use.

        The text is taken from the storage's fulltext cache when present;
        otherwise it is read from the storage and put into that cache.
        """
        if self._data is not None:
            return self._data

        nc = self._manifestlog.nodeconstants
        if self._node == nc.nullid:
            self._data = manifestdict(nc.nodelen)
            return self._data

        store = self._storage()
        cache = store.fulltextcache
        if self._node in cache:
            text = pycompat.bytestr(cache[self._node])
        else:
            text = store.revision(self._node)
            cache[self._node] = bytearray(text)
        self._data = manifestdict(nc.nodelen, text)
        return self._data

    def readfast(self, shallow=False):
        """Call readdelta or read, whichever is expected to be less work.

        readdelta is picked when the stored delta is against one of the
        revision's parents, since it can then be read quickly.

        `shallow` makes no difference here, this being a flat manifest.
        """
        store = self._storage()
        r = store.rev(self._node)
        base = store.deltaparent(r)
        usedelta = base != nullrev and base in store.parentrevs(r)
        return self.readdelta() if usedelta else self.read()

    def readdelta(self, shallow=False):
        """Return a manifest built from the delta against the delta parent.

        Only the entries carried by the revlog delta between the delta
        parent and this revision are included. According to the original
        documentation these are the entries present in this manifest but
        not in p1, which is efficient to read when the revlog delta is
        already against p1.

        The value of `shallow` has no effect on flat manifests.
        """
        store = self._storage()
        r = store.rev(self._node)
        delta = store.revdiff(store.deltaparent(r), r)
        d = mdiff.patchtext(delta)
        return manifestdict(store.nodeconstants.nodelen, d)

    def find(self, key):
        """Delegate to ``find(key)`` of the manifest returned by read()."""
        manifest = self.read()
        return manifest.find(key)

2153

2154

2155

@interfaceutil.implementer(repository.imanifestrevisionwritable)
class memtreemanifestctx:
    """An in-memory tree manifest that can be written to the root storage."""

    def __init__(self, manifestlog, dir=b''):
        self._manifestlog = manifestlog
        self._dir = dir
        nodeconstants = manifestlog.nodeconstants
        self._treemanifest = treemanifest(nodeconstants)

    def _storage(self):
        """Return the root (``b''``) storage of the manifest log."""
        mflog = self._manifestlog
        return mflog.getstorage(b'')

    def copy(self):
        """Return a new memtreemanifestctx holding a copy of the tree manifest."""
        duplicate = memtreemanifestctx(self._manifestlog, dir=self._dir)
        duplicate._treemanifest = self._treemanifest.copy()
        return duplicate

    def read(self):
        """Return the tree manifest held by this context."""
        return self._treemanifest

    def write(self, transaction, link, p1, p2, added, removed, match=None):
        """Add the held tree manifest to the root storage.

        The storage's ``add`` is given a ``readtree`` callback that reads
        the manifest of a (directory, node) pair through the manifest log;
        the result of ``add`` is returned.
        """
        mflog = self._manifestlog

        def readtree(dir, node):
            return mflog.get(dir, node).read()

        store = self._storage()
        return store.add(
            self._treemanifest,
            transaction,
            link,
            p1,
            p2,
            added,
            removed,
            readtree=readtree,
            match=match,
        )

2188

2189

2190

@interfaceutil.implementer(repository.imanifestrevisionstored)
class treemanifestctx:
    """Stored manifest revision context for one directory of a tree manifest.

    The parsed manifest is built on the first ``read()`` call and kept in
    ``self._data`` for subsequent calls.
    """

    def __init__(self, manifestlog, dir, node):
        self._manifestlog = manifestlog
        self._dir = dir
        self._data = None

        self._node = node

        # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so
        # that we can instantiate treemanifestctx objects for directories we
        # don't have on disk.
        # self.p1, self.p2 = store.parents(node)
        # rev = store.rev(node)
        # self.linkrev = store.linkrev(rev)

    def _storage(self):
        """Return the storage object for this directory.

        When the manifestlog's narrow matcher is restrictive and does not
        visit this directory, an ``excludedmanifestrevlog`` stand-in is
        returned instead of the real storage.
        """
        narrowmatch = self._manifestlog._narrowmatch
        # self._dir[:-1] drops the last character of the directory name
        # before asking the matcher about it.
        excluded = not narrowmatch.always() and not narrowmatch.visitdir(
            self._dir[:-1]
        )
        if excluded:
            return excludedmanifestrevlog(
                self._manifestlog.nodeconstants, self._dir
            )
        return self._manifestlog.getstorage(self._dir)

    def read(self):
        """Return the manifest for this revision, building it on first use."""
        if self._data is not None:
            return self._data

        store = self._storage()
        nodeconstants = self._manifestlog.nodeconstants

        if self._node == nodeconstants.nullid:
            # The null node maps to an empty manifest.
            self._data = treemanifest(nodeconstants)
        # TODO accessing non-public API
        elif store._treeondisk:
            tree = treemanifest(nodeconstants, dir=self._dir)

            def gettext():
                return store.revision(self._node)

            def readsubtree(dir, subm):
                # Set verify to False since we need to be able to create
                # subtrees for trees that don't exist on disk.
                return self._manifestlog.get(dir, subm, verify=False).read()

            tree.read(gettext, readsubtree)
            tree.setnode(self._node)
            self._data = tree
        else:
            cache = store.fulltextcache
            if self._node in cache:
                text = pycompat.bytestr(cache[self._node])
            else:
                text = store.revision(self._node)
                # Remember the full text (as a bytearray) for later reads.
                arraytext = bytearray(text)
                cache[self._node] = arraytext
            self._data = treemanifest(nodeconstants, dir=self._dir, text=text)

        return self._data

    def node(self):
        """Return the node this context was created for."""
        return self._node

    def copy(self):
        """Return a ``memtreemanifestctx`` wrapping a copy of this manifest."""
        duplicate = memtreemanifestctx(self._manifestlog, dir=self._dir)
        duplicate._treemanifest = self.read().copy()
        return duplicate

    @propertycache
    def parents(self):
        storage = self._storage()
        return storage.parents(self._node)

    def readdelta(self, shallow=False):
        """Return a manifest holding only the entries of this revision that
        differ from its delta parent's manifest.

        This is cheap to compute when the revlog delta is already against p1.

        With ``shallow`` set, only this directory's own delta is read and
        subdirectory manifests are not loaded recursively. Subdirectory
        entries are then reported as they appear in the manifest: listed
        among the files and recognizable only by their 't' flag.
        """
        store = self._storage()
        if shallow:
            rev = store.rev(self._node)
            delta = store.revdiff(store.deltaparent(rev), rev)
            patched = mdiff.patchtext(delta)
            return manifestdict(store.nodeconstants.nodelen, patched)

        # Need to perform a slow delta
        baserev = store.deltaparent(store.rev(self._node))
        basemf = self._manifestlog.get(self._dir, store.node(baserev)).read()
        currentmf = self.read()
        result = treemanifest(self._manifestlog.nodeconstants, dir=self._dir)
        changes = basemf.diff(currentmf)
        for path, ((oldnode, oldflags), (newnode, newflags)) in changes.items():
            if not newnode:
                # No node on the new side: nothing to record for this path.
                continue
            result[path] = newnode
            if newflags:
                result.setflag(path, newflags)
        return result

    def readfast(self, shallow=False):
        """Pick the cheaper of ``readdelta`` and ``read`` and return its result.

        ``readdelta`` is used when the stored delta is against one of this
        revision's parents, because it can then be read quickly.

        With ``shallow`` set, only the entries of this manifest are returned,
        without any submanifests.
        """
        store = self._storage()
        rev = store.rev(self._node)
        base = store.deltaparent(rev)
        if base != nullrev and base in store.parentrevs(rev):
            return self.readdelta(shallow=shallow)

        if not shallow:
            return self.read()

        nodelen = store.nodeconstants.nodelen
        return manifestdict(nodelen, store.revision(self._node))

    def find(self, key):
        """Delegate the lookup of ``key`` to the manifest from ``read()``."""
        manifest = self.read()
        return manifest.find(key)

2312

2313

2314

class excludeddir(treemanifest):
    """Placeholder for a directory that is excluded from the repository.

    When narrowing is active on a treemanifest repository, some directory
    revlogs are left out of the clone. That saves clients a lot of storage,
    but internals still need a pseudo-manifest to work with so that a merge
    conflict outside the narrowspec can be detected. This class is that
    pseudo-manifest: it represents a directory whose node is known but whose
    contents are not.
    """

    def __init__(self, nodeconstants, dir, node):
        super().__init__(nodeconstants, dir)
        self._node = node
        # Register an empty-named file entry. Iterators and similar helpers
        # will include it, so it shows up as the directory itself (i.e.
        # something like "dir/").
        self._files[b''] = node
        self._flags[b''] = b't'

    # Manifests outside the narrowspec should never be modified, so copying
    # is skipped. This matters noticeably when a large number of directories
    # fall outside the narrowspec. It also keeps the "copy" the same type as
    # the original, which the super type's copy() would not do.
    def copy(self):
        return self

2341

2342

2343

class excludeddirmanifestctx(treemanifestctx):
    """context wrapper for excludeddir - see that docstring for rationale"""

    def __init__(self, nodeconstants, dir, node):
        # Note: treemanifestctx.__init__ is not invoked here, so the
        # `_manifestlog` and `_data` attributes it would set do not exist on
        # these instances.
        self.nodeconstants = nodeconstants
        self._dir = dir
        self._node = node

    def read(self):
        """Return a new ``excludeddir`` stand-in for this directory/node."""
        return excludeddir(self.nodeconstants, self._dir, self._node)

    def readfast(self, shallow=False):
        """Return the same stand-in as ``read()``; ``shallow`` is ignored."""
        # special version of readfast since we don't have underlying storage
        return self.read()

    def write(self, *args, **kwargs):
        """Always raise ``error.ProgrammingError``.

        Any positional and keyword arguments are accepted and ignored, so a
        caller that passes arguments by keyword (for example ``match=...``)
        gets the intended ProgrammingError rather than a TypeError about an
        unexpected keyword argument.
        """
        raise error.ProgrammingError(
            b'attempt to write manifest from excluded dir %s' % self._dir
        )

2362

2363

2364

class excludedmanifestrevlog(manifestrevlog):
    """Placeholder for treemanifest revlogs that were excluded.

    With narrowing active on a treemanifest repository, there will be
    references to directories that cannot be seen because their revlog was
    skipped. This class conforms to the manifestrevlog interface for such
    directories and proactively blocks writes outside the narrowspec.
    """

    def __init__(self, nodeconstants, dir):
        self.nodeconstants = nodeconstants
        self._dir = dir

    def __len__(self):
        message = b'attempt to get length of excluded dir %s' % self._dir
        raise error.ProgrammingError(message)

    def rev(self, node):
        message = b'attempt to get rev from excluded dir %s' % self._dir
        raise error.ProgrammingError(message)

    def linkrev(self, node):
        message = b'attempt to get linkrev from excluded dir %s' % self._dir
        raise error.ProgrammingError(message)

    def node(self, rev):
        message = b'attempt to get node from excluded dir %s' % self._dir
        raise error.ProgrammingError(message)

    def add(self, *args, **kwargs):
        # Entries must never be written to dirlogs outside the narrow clone.
        # Even so, writesubtree() in _addtree() still calls this method, so
        # it has to be tolerated here. Ideally that caller would avoid
        # calling add() with a clean manifest (_dirty is always False in
        # excludeddir instances).
        return None

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # manifest.py - manifest revision class for mercurial
             #
             # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             import heapq
             import itertools
             import struct
             import weakref
             from .i18n import _
             from .node import (
                 bin,
                 hex,
                 nullrev,
             )
             from . import (
                 encoding,
                 error,
                 match as matchmod,
                 mdiff,
                 pathutil,
                 policy,
                 pycompat,
                 revlog,
                 util,
             )
             from .interfaces import (
                 repository,
                 util as interfaceutil,
             )
             from .revlogutils import (
                 constants as revlog_constants,
             )
             # Parser module resolved through the policy importer; it is probed further
             # down in this module for a ``lazymanifest`` implementation.
             parsers = policy.importmod('parsers')
             # Local alias for util.propertycache, used as a decorator in this module.
             propertycache = util.propertycache
             # Allow tests to more easily test the alternate path in manifestdict.fastdelta()
             # (fastdelta() falls back to a full text diff once the number of changes
             # reaches this value).
             FASTDELTA_TEXTDIFF_THRESHOLD = 1000
             def _parse(nodelen, data):
                 # This method does a little bit of excessive-looking
                 # precondition checking. This is so that the behavior of this
                 # class exactly matches its C counterpart to try and help
                 # prevent surprise breakage for anyone that develops against
                 # the pure version.
                 if data and data[-1:] != b'\n':
                     raise ValueError(b'Manifest did not end in a newline.')
                 prev = None
                 for l in data.splitlines():
                     if prev is not None and prev > l:
                         raise ValueError(b'Manifest lines not in sorted order.')
                     prev = l
                     f, n = l.split(b'\0')
                     nl = len(n)
                     flags = n[-1:]
                     if flags in _manifestflags:
                         n = n[:-1]
                         nl -= 1
                     else:
                         flags = b''
                     if nl != 2 * nodelen:
                         raise ValueError(b'Invalid manifest line')
                     yield f, bin(n), flags
             def _text(it):
                 """Serialize an iterable of ``(filename, node, flags)`` to manifest text.

                 Every filename is validated with ``_checkforbidden`` before the joined
                 text is returned.
                 """
                 names = []
                 chunks = []
                 for name, node, flag in it:
                     names.append(name)
                     # if this is changed to support newlines in filenames,
                     # be sure to check the templates/ dir again (especially *-raw.tmpl)
                     chunks.append(b"%s\0%s%s\n" % (name, hex(node), flag))
                 _checkforbidden(names)
                 return b''.join(chunks)
             class lazymanifestiter:
                 """Iterator over the file names of a lazy manifest, in position order."""
                 def __init__(self, lm):
                     self.pos = 0
                     self.lm = lm
                 def __iter__(self):
                     return self
                 def next(self):
                     """Return the next file name, or raise StopIteration at the end."""
                     try:
                         entry, offset = self.lm._get(self.pos)
                     except IndexError:
                         raise StopIteration
                     self.pos += 1
                     if offset == -1:
                         # Entry is a tuple whose first item is the file name.
                         return entry[0]
                     # Entry is the raw buffer: the name runs up to the NUL byte.
                     return entry[offset : entry.find(b'\x00', offset)]
                 __next__ = next
             class lazymanifestiterentries:
                 """Iterator over the ``(filename, node, flags)`` entries of a lazy manifest."""
                 def __init__(self, lm):
                     self.lm = lm
                     self.pos = 0
                 def __iter__(self):
                     return self
                 def next(self):
                     """Return the next entry, or raise StopIteration at the end.

                     Raises error.StorageError when a line in the raw buffer is malformed.
                     """
                     lm = self.lm
                     try:
                         data, pos = lm._get(self.pos)
                     except IndexError:
                         raise StopIteration
                     if pos == -1:
                         # Added/modified entries are already stored as tuples.
                         self.pos += 1
                         return data
                     nul = data.find(b'\x00', pos)
                     eol = data.find(b'\n', pos)
                     if nul == -1 or eol == -1 or eol < nul:
                         raise error.StorageError(b'Invalid manifest line')
                     # Hex digits sit between the NUL and the newline, minus an
                     # optional trailing flag byte.
                     hexlen = eol - nul - 1
                     flag = data[eol - 1 : eol]
                     if flag in _manifestflags:
                         hexlen -= 1
                     else:
                         flag = b''
                     if hexlen != 2 * lm._nodelen:
                         raise error.StorageError(b'Invalid manifest line')
                     node = unhexlify(data, lm.extrainfo[self.pos], nul + 1, hexlen)
                     # Only advance once the line has been decoded successfully.
                     self.pos += 1
                     return (data[pos:nul], node, flag)
                 __next__ = next
-            def unhexlify(data, extra, pos, length):
+            def unhexlify(data: bytes, extra: int, pos, length: int):
                 s = bin(data[pos : pos + length])
                 if extra:
-                    s += chr(extra & 0xFF)
+                    s += bytes([extra & 0xFF])
                 return s
             def _cmp(a, b):
                 return (a > b) - (a < b)
             # Byte strings accepted as the flags of a manifest entry (the empty string
             # means "no flag").
             _manifestflags = {b'', b'l', b't', b'x'}
             class _lazymanifest:
                 """A pure python manifest backed by a byte string.  It is supplimented with
                 internal lists as it is modified, until it is compacted back to a pure byte
                 string.
                 ``data`` is the initial manifest data.
                 ``positions`` is a list of offsets, one per manifest entry.  Positive
                 values are offsets into ``data``, negative values are offsets into the
                 ``extradata`` list.  When an entry is removed, its entry is dropped from
                 ``positions``.  The values are encoded such that when walking the list and
                 indexing into ``data`` or ``extradata`` as appropriate, the entries are
                 sorted by filename.
                 ``extradata`` is a list of (key, hash, flags) for entries that were added or
                 modified since the manifest was created or compacted.
                 """
                 def __init__(
                     self,
                     nodelen,
                     data,
                     positions=None,
                     extrainfo=None,
                     extradata=None,
                     hasremovals=False,
                 ):
                     self._nodelen = nodelen
                     if positions is None:
                         self.positions = self.findlines(data)
                         self.extrainfo = [0] * len(self.positions)
                         self.data = data
                         self.extradata = []
                         self.hasremovals = False
                     else:
                         self.positions = positions[:]
                         self.extrainfo = extrainfo[:]
                         self.extradata = extradata[:]
                         self.data = data
                         self.hasremovals = hasremovals
                 def findlines(self, data):
                     if not data:
                         return []
                     pos = data.find(b"\n")
                     if pos == -1 or data[-1:] != b'\n':
                         raise ValueError(b"Manifest did not end in a newline.")
                     positions = [0]
                     prev = data[: data.find(b'\x00')]
                     while pos < len(data) - 1 and pos != -1:
                         positions.append(pos + 1)
                         nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]
                         if nexts < prev:
                             raise ValueError(b"Manifest lines not in sorted order.")
                         prev = nexts
                         pos = data.find(b"\n", pos + 1)
                     return positions
                 def _get(self, index):
                     # get the position encoded in pos:
                     #   positive number is an index in 'data'
                     #   negative number is in extrapieces
                     pos = self.positions[index]
                     if pos >= 0:
                         return self.data, pos
                     return self.extradata[-pos - 1], -1
                 def _getkey(self, pos):
                     if pos >= 0:
                         return self.data[pos : self.data.find(b'\x00', pos + 1)]
                     return self.extradata[-pos - 1][0]
                 def bsearch(self, key):
                     first = 0
                     last = len(self.positions) - 1
                     while first <= last:
                         midpoint = (first + last) // 2
                         nextpos = self.positions[midpoint]
                         candidate = self._getkey(nextpos)
                         r = _cmp(key, candidate)
                         if r == 0:
                             return midpoint
                         else:
                             if r < 0:
                                 last = midpoint - 1
                             else:
                                 first = midpoint + 1
                     return -1
                 def bsearch2(self, key):
                     # same as the above, but will always return the position
                     # done for performance reasons
                     first = 0
                     last = len(self.positions) - 1
                     while first <= last:
                         midpoint = (first + last) // 2
                         nextpos = self.positions[midpoint]
                         candidate = self._getkey(nextpos)
                         r = _cmp(key, candidate)
                         if r == 0:
                             return (midpoint, True)
                         else:
                             if r < 0:
                                 last = midpoint - 1
                             else:
                                 first = midpoint + 1
                     return (first, False)
                 def __contains__(self, key):
                     return self.bsearch(key) != -1
                 def __getitem__(self, key):
                     if not isinstance(key, bytes):
                         raise TypeError(b"getitem: manifest keys must be a bytes.")
                     needle = self.bsearch(key)
                     if needle == -1:
                         raise KeyError
                     data, pos = self._get(needle)
                     if pos == -1:
                         return (data[1], data[2])
                     zeropos = data.find(b'\x00', pos)
                     nlpos = data.find(b'\n', zeropos)
                     assert 0 <= needle <= len(self.positions)
                     assert len(self.extrainfo) == len(self.positions)
                     if zeropos == -1 or nlpos == -1 or nlpos < zeropos:
                         raise error.StorageError(b'Invalid manifest line')
                     hlen = nlpos - zeropos - 1
                     flags = data[nlpos - 1 : nlpos]
                     if flags in _manifestflags:
                         hlen -= 1
                     else:
                         flags = b''
                     if hlen != 2 * self._nodelen:
                         raise error.StorageError(b'Invalid manifest line')
                     hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)
                     return (hashval, flags)
                 def __delitem__(self, key):
                     needle, found = self.bsearch2(key)
                     if not found:
                         raise KeyError
                     cur = self.positions[needle]
                     self.positions = self.positions[:needle] + self.positions[needle + 1 :]
                     self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]
                     if cur >= 0:
                         # This does NOT unsort the list as far as the search functions are
                         # concerned, as they only examine lines mapped by self.positions.
                         self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]
                         self.hasremovals = True
                 def __setitem__(self, key, value):
                     if not isinstance(key, bytes):
                         raise TypeError(b"setitem: manifest keys must be a byte string.")
                     if not isinstance(value, tuple) or len(value) != 2:
                         raise TypeError(
                             b"Manifest values must be a tuple of (node, flags)."
                         )
                     hashval = value[0]
                     if not isinstance(hashval, bytes) or len(hashval) not in (20, 32):
                         raise TypeError(b"node must be a 20-byte or 32-byte byte string")
                     flags = value[1]
                     if not isinstance(flags, bytes) or len(flags) > 1:
                         raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)
                     needle, found = self.bsearch2(key)
                     if found:
                         # put the item
                         pos = self.positions[needle]
                         if pos < 0:
                             self.extradata[-pos - 1] = (key, hashval, value[1])
                         else:
                             # just don't bother
                             self.extradata.append((key, hashval, value[1]))
                             self.positions[needle] = -len(self.extradata)
                     else:
                         # not found, put it in with extra positions
                         self.extradata.append((key, hashval, value[1]))
                         self.positions = (
                             self.positions[:needle]
                             + [-len(self.extradata)]
                             + self.positions[needle:]
                         )
                         self.extrainfo = (
                             self.extrainfo[:needle] + [0] + self.extrainfo[needle:]
                         )
                 def copy(self):
                     # XXX call _compact like in C?
                     return _lazymanifest(
                         self._nodelen,
                         self.data,
                         self.positions,
                         self.extrainfo,
                         self.extradata,
                         self.hasremovals,
                     )
                 def _compact(self):
                     # hopefully not called TOO often
                     if len(self.extradata) == 0 and not self.hasremovals:
                         return
                     l = []
                     i = 0
                     offset = 0
                     self.extrainfo = [0] * len(self.positions)
                     while i < len(self.positions):
                         if self.positions[i] >= 0:
                             cur = self.positions[i]
                             last_cut = cur
                             # Collect all contiguous entries in the buffer at the current
                             # offset, breaking out only for added/modified items held in
                             # extradata, or a deleted line prior to the next position.
                             while True:
                                 self.positions[i] = offset
                                 i += 1
                                 if i == len(self.positions) or self.positions[i] < 0:
                                     break
                                 # A removed file has no positions[] entry, but does have an
                                 # overwritten first byte.  Break out and find the end of the
                                 # current good entry/entries if there is a removed file
                                 # before the next position.
                                 if (
                                     self.hasremovals
                                     and self.data.find(b'\n\x00', cur, self.positions[i])
                                     != -1
                                 ):
                                     break
                                 offset += self.positions[i] - cur
                                 cur = self.positions[i]
                             end_cut = self.data.find(b'\n', cur)
                             if end_cut != -1:
                                 end_cut += 1
                             offset += end_cut - cur
                             l.append(self.data[last_cut:end_cut])
                         else:
                             while i < len(self.positions) and self.positions[i] < 0:
                                 cur = self.positions[i]
                                 t = self.extradata[-cur - 1]
                                 l.append(self._pack(t))
                                 self.positions[i] = offset
                                 # Hashes are either 20 bytes (old sha1s) or 32
                                 # bytes (new non-sha1).
                                 hlen = 20
                                 if len(t[1]) > 25:
                                     hlen = 32
                                 if len(t[1]) > hlen:
                                     self.extrainfo[i] = ord(t[1][hlen + 1])
                                 offset += len(l[-1])
                                 i += 1
                     self.data = b''.join(l)
                     self.hasremovals = False
                     self.extradata = []
                 def _pack(self, d):
                     n = d[1]
                     assert len(n) in (20, 32)
                     return d[0] + b'\x00' + hex(n) + d[2] + b'\n'
                 def text(self):
                     self._compact()
                     return self.data
                 def diff(self, m2, clean=False):
                     '''Finds changes between the current manifest and m2.'''
                     # XXX think whether efficiency matters here
                     diff = {}
                     for fn, e1, flags in self.iterentries():
                         if fn not in m2:
                             diff[fn] = (e1, flags), (None, b'')
                         else:
                             e2 = m2[fn]
                             if (e1, flags) != e2:
                                 diff[fn] = (e1, flags), e2
                             elif clean:
                                 diff[fn] = None
                     for fn, e2, flags in m2.iterentries():
                         if fn not in self:
                             diff[fn] = (None, b''), (e2, flags)
                     return diff
                 def iterentries(self):
                     return lazymanifestiterentries(self)
                 def iterkeys(self):
                     return lazymanifestiter(self)
                 def __iter__(self):
                     return lazymanifestiter(self)
                 def __len__(self):
                     return len(self.positions)
                 def filtercopy(self, filterfn):
                     # XXX should be optimized
                     c = _lazymanifest(self._nodelen, b'')
                     for f, n, fl in self.iterentries():
                         if filterfn(f):
                             c[f] = n, fl
                     return c
             # Use the ``lazymanifest`` exposed by the parsers module when it has one;
             # otherwise keep the pure-Python class defined above.
             try:
                 _lazymanifest = parsers.lazymanifest
             except AttributeError:
                 pass
             @interfaceutil.implementer(repository.imanifestdict)
             class manifestdict:
                 """Dict-like manifest mapping file names to nodes and flags.

                 All storage is delegated to a ``_lazymanifest`` held in ``self._lm``.
                 """
                 def __init__(self, nodelen, data=b''):
                     self._nodelen = nodelen
                     self._lm = _lazymanifest(nodelen, data)
                 def __getitem__(self, key):
                     """Return the node stored for ``key``."""
                     return self._lm[key][0]
                 def find(self, key):
                     """Return the ``(node, flags)`` pair stored for ``key``."""
                     return self._lm[key]
                 def __len__(self):
                     return len(self._lm)
                 def __nonzero__(self):
                     # nonzero is covered by the __len__ function, but implementing it here
                     # makes it easier for extensions to override.
                     return len(self._lm) != 0
                 __bool__ = __nonzero__
                 def set(self, key, node, flags):
                     """Store ``node`` and ``flags`` for ``key``."""
                     self._lm[key] = node, flags
                 def __setitem__(self, key, node):
                     """Store ``node`` for ``key``, keeping the flags ``key`` currently has."""
                     self._lm[key] = node, self.flags(key)
                 def __contains__(self, key):
                     if key is None:
                         return False
                     return key in self._lm
                 def __delitem__(self, key):
                     del self._lm[key]
                 def __iter__(self):
                     return self._lm.__iter__()
                 def iterkeys(self):
                     return self._lm.iterkeys()
                 def keys(self):
                     return list(self.iterkeys())
                 def filesnotin(self, m2, match=None):
                     '''Set of files in this manifest that are not in the other'''
                     if match is not None:
                         # Wrap the matcher with a bad-file callback that does nothing.
                         match = matchmod.badmatch(match, lambda path, msg: None)
                         sm2 = set(m2.walk(match))
                         return {f for f in self.walk(match) if f not in sm2}
                     return {f for f in self if f not in m2}
                 @propertycache
                 def _dirs(self):
                     return pathutil.dirs(self)
                 def dirs(self):
                     return self._dirs
                 def hasdir(self, dir):
                     return dir in self._dirs
                 def _filesfastpath(self, match):
                     """Checks whether we can correctly and quickly iterate over matcher
                     files instead of over manifest files."""
                     files = match.files()
                     return len(files) < 100 and (
                         match.isexact()
                         or (match.prefix() and all(fn in self for fn in files))
                     )
                 def walk(self, match):
                     """Generates matching file names.
                     Equivalent to manifest.matches(match).iterkeys(), but without creating
                     an entirely new manifest.
                     It also reports nonexistent files by marking them bad with match.bad().
                     """
                     if match.always():
                         for f in iter(self):
                             yield f
                         return
                     fset = set(match.files())
                     # avoid the entire walk if we're only looking for specific files
                     if self._filesfastpath(match):
                         for fn in sorted(fset):
                             if fn in self:
                                 yield fn
                         return
                     for fn in self:
                         if fn in fset:
                             # specified pattern is the exact name
                             fset.remove(fn)
                         if match(fn):
                             yield fn
                     # for dirstate.walk, files=[''] means "walk the whole tree".
                     # follow that here, too
                     fset.discard(b'')
                     # Whatever is left in fset was never seen as a file; report it as
                     # bad unless it names a directory of this manifest.
                     for fn in sorted(fset):
                         if not self.hasdir(fn):
                             match.bad(fn, None)
                 def _matches(self, match):
                     '''generate a new manifest filtered by the match argument'''
                     if match.always():
                         return self.copy()
                     if self._filesfastpath(match):
                         m = manifestdict(self._nodelen)
                         lm = self._lm
                         for fn in match.files():
                             if fn in lm:
                                 m._lm[fn] = lm[fn]
                         return m
                     m = manifestdict(self._nodelen)
                     m._lm = self._lm.filtercopy(match)
                     return m
                 def diff(self, m2, match=None, clean=False):
                     """Finds changes between the current manifest and m2.
                     Args:
                       m2: the manifest to which this manifest should be compared.
                       clean: if true, include files unchanged between these manifests
                              with a None value in the returned dictionary.
                     The result is returned as a dict with filename as key and
                     values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
                     nodeid in the current/other manifest and fl1/fl2 is the flag
                     in the current/other manifest. Where the file does not exist,
                     the nodeid will be None and the flags will be the empty
                     string.
                     """
                     if match:
                         # Narrow both sides first, then diff the filtered manifests.
                         m1 = self._matches(match)
                         m2 = m2._matches(match)
                         return m1.diff(m2, clean=clean)
                     return self._lm.diff(m2._lm, clean)
                 def setflag(self, key, flag):
                     """Set the flag of ``key``; raises TypeError for an unknown flag."""
                     if flag not in _manifestflags:
                         raise TypeError(b"Invalid manifest flag set.")
                     self._lm[key] = self[key], flag
                 def get(self, key, default=None):
                     """Return the node for ``key``, or ``default`` when it is absent."""
                     try:
                         return self._lm[key][0]
                     except KeyError:
                         return default
                 def flags(self, key):
                     """Return the flags for ``key``, or ``b''`` when it is absent."""
                     try:
                         return self._lm[key][1]
                     except KeyError:
                         return b''
                 def copy(self):
                     c = manifestdict(self._nodelen)
                     c._lm = self._lm.copy()
                     return c
                 def items(self):
                     """Return a generator of ``(filename, node)`` pairs."""
                     return (x[:2] for x in self._lm.iterentries())
                 def iteritems(self):
                     """Return a generator of ``(filename, node)`` pairs (same as items())."""
                     return (x[:2] for x in self._lm.iterentries())
                 def iterentries(self):
                     return self._lm.iterentries()
                 def text(self):
                     # most likely uses native version
                     return self._lm.text()
                 def fastdelta(self, base, changes):
                     """Given a base manifest text as a bytearray and a list of changes
                     relative to that text, compute a delta that can be used by revlog.

                     ``changes`` is iterated as ``(filename, todelete)`` pairs.
                     Returns ``(arraytext, deltatext)``.
                     """
                     delta = []
                     # dstart/dend delimit the base range replaced by the pending delta
                     # chunk; dline collects the replacement lines for that chunk.
                     dstart = None
                     dend = None
                     dline = [b""]
                     start = 0
                     # zero copy representation of base as a buffer
                     addbuf = util.buffer(base)
                     changes = list(changes)
                     if len(changes) < FASTDELTA_TEXTDIFF_THRESHOLD:
                         # start with a readonly loop that finds the offset of
                         # each line and creates the deltas
                         for f, todelete in changes:
                             # bs will either be the index of the item or the insert point
                             start, end = _msearch(addbuf, f, start)
                             if not todelete:
                                 h, fl = self._lm[f]
                                 l = b"%s\0%s%s\n" % (f, hex(h), fl)
                             else:
                                 if start == end:
                                     # item we want to delete was not found, error out
                                     raise AssertionError(
                                         _(b"failed to remove %s from manifest") % f
                                     )
                                 l = b""
                             # Merge this change into the pending chunk when it starts
                             # inside or right at the end of it; otherwise flush the
                             # pending chunk and begin a new one.
                             if dstart is not None and dstart <= start and dend >= start:
                                 if dend < end:
                                     dend = end
                                 if l:
                                     dline.append(l)
                             else:
                                 if dstart is not None:
                                     delta.append([dstart, dend, b"".join(dline)])
                                 dstart = start
                                 dend = end
                                 dline = [l]
                         if dstart is not None:
                             delta.append([dstart, dend, b"".join(dline)])
                         # apply the delta to the base, and get a delta for addrevision
                         deltatext, arraytext = _addlistdelta(base, delta)
                     else:
                         # For large changes, it's much cheaper to just build the text and
                         # diff it.
                         arraytext = bytearray(self.text())
                         deltatext = mdiff.textdiff(
                             util.buffer(base), util.buffer(arraytext)
                         )
                     return arraytext, deltatext
             def _msearch(m, s, lo=0, hi=None):
                 """return a tuple (start, end) that says where to find s within m.
                 If the string is found m[start:end] are the line containing
                 that string.  If start == end the string was not found and
                 they indicate the proper sorted insertion point.
                 m should be a buffer, a memoryview or a byte string.
                 s is a byte string"""
                 def advance(i, c):
                     while i < lenm and m[i : i + 1] != c:
                         i += 1
                     return i
                 if not s:
                     return (lo, lo)
                 lenm = len(m)
                 if not hi:
                     hi = lenm
                 while lo < hi:
                     mid = (lo + hi) // 2
                     start = mid
                     while start > 0 and m[start - 1 : start] != b'\n':
                         start -= 1
                     end = advance(start, b'\0')
                     if bytes(m[start:end]) < s:
                         # we know that after the null there are 40 bytes of sha1
                         # this translates to the bisect lo = mid + 1
                         lo = advance(end + 40, b'\n') + 1
                     else:
                         # this translates to the bisect hi = mid
                         hi = start
                 end = advance(lo, b'\0')
                 found = m[lo:end]
                 if s == found:
                     # we know that after the null there are 40 bytes of sha1
                     end = advance(end + 40, b'\n')
                     return (lo, end + 1)
                 else:
                     return (lo, lo)
             def _checkforbidden(l):
                 """Check filenames for illegal characters."""
                 for f in l:
                     if b'\n' in f or b'\r' in f:
                         raise error.StorageError(
                             _(b"'\\n' and '\\r' disallowed in filenames: %r")
                             % pycompat.bytestr(f)
                         )
             # apply the changes collected during the bisect loop to our addlist
             # return a delta suitable for addrevision
             def _addlistdelta(addlist, x):
                 # for large addlist arrays, building a new array is cheaper
                 # than repeatedly modifying the existing one
                 currentposition = 0
                 newaddlist = bytearray()
                 for start, end, content in x:
                     newaddlist += addlist[currentposition:start]
                     if content:
                         newaddlist += bytearray(content)
                     currentposition = end
                 newaddlist += addlist[currentposition:]
                 deltatext = b"".join(
                     struct.pack(b">lll", start, end, len(content)) + content
                     for start, end, content in x
                 )
                 return deltatext, newaddlist
             def _splittopdir(f):
                 if b'/' in f:
                     dir, subpath = f.split(b'/', 1)
                     return dir + b'/', subpath
                 else:
                     return b'', f
             # Do-nothing callable used as a sentinel: treemanifest stores it in
             # _loadfunc/_copyfunc and compares against it by identity to tell
             # whether a deferred load or copy is still pending.
             _noop = lambda s: None
             @interfaceutil.implementer(repository.imanifestdict)
             class treemanifest:
                 def __init__(self, nodeconstants, dir=b'', text=b''):
                     """Create the tree for directory ``dir``.

                     ``nodeconstants`` supplies ``nullid`` (the initial node) and
                     ``nodelen``. When ``text`` is non-empty it is parsed as a flat
                     manifest and the new tree is marked dirty; a tree entry in
                     ``text`` makes the load of that subtree raise AssertionError.
                     """
                     self.nodeconstants = nodeconstants
                     self._dir = dir
                     self._node = nodeconstants.nullid
                     self._nodelen = nodeconstants.nodelen
                     # _noop in these slots means no deferred load/copy is pending
                     self._loadfunc = self._copyfunc = _noop
                     self._dirty = False
                     self._dirs, self._lazydirs = {}, {}
                     # Using _lazymanifest here is a little slower than plain old dicts
                     self._files, self._flags = {}, {}
                     if not text:
                         return

                     def readsubtree(subdir, subm):
                         raise AssertionError(
                             b'treemanifest constructor only accepts flat manifests'
                         )

                     self.parse(text, readsubtree)
                     self._dirty = True  # Mark flat manifest dirty after parsing
                 def _subpath(self, path):
                     return self._dir + path
                 def _loadalllazy(self):
                     selfdirs = self._dirs
                     subpath = self._subpath
                     for d, (node, readsubtree, docopy) in self._lazydirs.items():
                         if docopy:
                             selfdirs[d] = readsubtree(subpath(d), node).copy()
                         else:
                             selfdirs[d] = readsubtree(subpath(d), node)
                     self._lazydirs = {}
                 def _loadlazy(self, d):
                     v = self._lazydirs.get(d)
                     if v:
                         node, readsubtree, docopy = v
                         if docopy:
                             self._dirs[d] = readsubtree(self._subpath(d), node).copy()
                         else:
                             self._dirs[d] = readsubtree(self._subpath(d), node)
                         del self._lazydirs[d]
                 def _loadchildrensetlazy(self, visit):
                     if not visit:
                         return None
                     if visit == b'all' or visit == b'this':
                         self._loadalllazy()
                         return None
                     loadlazy = self._loadlazy
                     for k in visit:
                         loadlazy(k + b'/')
                     return visit
                 def _loaddifflazy(self, t1, t2):
                     """load items in t1 and t2 if they're needed for diffing.
                     The criteria currently is:
                     - if it's not present in _lazydirs in either t1 or t2, load it in the
                       other (it may already be loaded or it may not exist, doesn't matter)
                     - if it's present in _lazydirs in both, compare the nodeid; if it
                       differs, load it in both
                     """
                     toloadlazy = []
                     for d, v1 in t1._lazydirs.items():
                         v2 = t2._lazydirs.get(d)
                         if not v2 or v2[0] != v1[0]:
                             toloadlazy.append(d)
                     for d, v1 in t2._lazydirs.items():
                         if d not in t1._lazydirs:
                             toloadlazy.append(d)
                     for d in toloadlazy:
                         t1._loadlazy(d)
                         t2._loadlazy(d)
                 def __len__(self):
                     self._load()
                     size = len(self._files)
                     self._loadalllazy()
                     for m in self._dirs.values():
                         size += m.__len__()
                     return size
                 def __nonzero__(self):
                     # Faster than "__len() != 0" since it avoids loading sub-manifests
                     return not self._isempty()
                 __bool__ = __nonzero__
                 def _isempty(self):
                     self._load()  # for consistency; already loaded by all callers
                     # See if we can skip loading everything.
                     if self._files or (
                         self._dirs and any(not m._isempty() for m in self._dirs.values())
                     ):
                         return False
                     self._loadalllazy()
                     return not self._dirs or all(m._isempty() for m in self._dirs.values())
                 @encoding.strmethod
                 def __repr__(self):
                     """Debug representation: directory, hex node, load and dirty state."""
                     # "loaded" means no deferred load function is pending
                     loaded = bool(self._loadfunc is _noop)
                     fields = (self._dir, hex(self._node), loaded, self._dirty, id(self))
                     return (
                         b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
                         % fields
                     )
                 def dir(self):
                     """The directory that this tree manifest represents, including a
                     trailing '/'. Empty string for the repo root directory."""
                     return self._dir
                 def node(self):
                     """This node of this instance. nullid for unsaved instances. Should
                     be updated when the instance is read or written from a revlog.
                     """
                     assert not self._dirty
                     return self._node
                 def setnode(self, node):
                     self._node = node
                     self._dirty = False
                 def iterentries(self):
                     self._load()
                     self._loadalllazy()
                     for p, n in sorted(
                         itertools.chain(self._dirs.items(), self._files.items())
                     ):
                         if p in self._files:
                             yield self._subpath(p), n, self._flags.get(p, b'')
                         else:
                             for x in n.iterentries():
                                 yield x
                 def items(self):
                     self._load()
                     self._loadalllazy()
                     for p, n in sorted(
                         itertools.chain(self._dirs.items(), self._files.items())
                     ):
                         if p in self._files:
                             yield self._subpath(p), n
                         else:
                             for f, sn in n.items():
                                 yield f, sn
                 iteritems = items
                 def iterkeys(self):
                     self._load()
                     self._loadalllazy()
                     for p in sorted(itertools.chain(self._dirs, self._files)):
                         if p in self._files:
                             yield self._subpath(p)
                         else:
                             for f in self._dirs[p]:
                                 yield f
                 def keys(self):
                     return list(self.iterkeys())
                 def __iter__(self):
                     return self.iterkeys()
                 def __contains__(self, f):
                     if f is None:
                         return False
                     self._load()
                     dir, subpath = _splittopdir(f)
                     if dir:
                         self._loadlazy(dir)
                         if dir not in self._dirs:
                             return False
                         return self._dirs[dir].__contains__(subpath)
                     else:
                         return f in self._files
                 def get(self, f, default=None):
                     """Return the node stored for path ``f``, or ``default``.

                     A path with a directory part is looked up in that subdirectory,
                     which is loaded if it was lazy; ``default`` is returned when the
                     subdirectory does not exist.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         return self._files.get(f, default)
                     self._loadlazy(topdir)
                     if topdir in self._dirs:
                         return self._dirs[topdir].get(rest, default)
                     return default
                 def __getitem__(self, f):
                     """Return the node stored for path ``f``.

                     Raises KeyError when the file or its top-level directory is
                     missing from the underlying dicts.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         return self._files[f]
                     self._loadlazy(topdir)
                     return self._dirs[topdir].__getitem__(rest)
                 def flags(self, f):
                     """Return the flags recorded for path ``f``, or ``b''``.

                     ``b''`` is also the answer when the subdirectory of ``f`` does
                     not exist, or when ``f`` itself is a key of ``_lazydirs`` or
                     ``_dirs``.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if topdir:
                         self._loadlazy(topdir)
                         if topdir in self._dirs:
                             return self._dirs[topdir].flags(rest)
                         return b''
                     if f in self._lazydirs or f in self._dirs:
                         return b''
                     return self._flags.get(f, b'')
                 def find(self, f):
                     """Return ``(node, flags)`` for path ``f``.

                     Flags default to ``b''``. Raises KeyError when the file or its
                     top-level directory is missing from the underlying dicts.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         return self._files[f], self._flags.get(f, b'')
                     self._loadlazy(topdir)
                     return self._dirs[topdir].find(rest)
                 def __delitem__(self, f):
                     """Remove path ``f`` (and its flags) and mark the tree dirty.

                     A subdirectory left empty by the removal is dropped as well.
                     Raises KeyError when the file or its top-level directory is
                     missing; the tree is not marked dirty in that case.
                     """
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         del self._files[f]
                         self._flags.pop(f, None)
                     else:
                         self._loadlazy(topdir)
                         self._dirs[topdir].__delitem__(rest)
                         # If the directory is now empty, remove it
                         if self._dirs[topdir]._isempty():
                             del self._dirs[topdir]
                     self._dirty = True
                 def set(self, f, node, flags):
                     """Set both the node and the flags for path f.

                     A missing subdirectory on the way to ``f`` is created. The tree
                     is marked dirty. Raises TypeError when ``flags`` is not one of
                     ``_manifestflags``.
                     """
                     assert node is not None
                     if flags not in _manifestflags:
                         raise TypeError(b"Invalid manifest flag set.")
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         assert len(node) in (20, 32)
                         self._files[f] = node
                         self._flags[f] = flags
                     else:
                         self._loadlazy(topdir)
                         if topdir not in self._dirs:
                             self._dirs[topdir] = treemanifest(
                                 self.nodeconstants, self._subpath(topdir)
                             )
                         self._dirs[topdir].set(rest, node, flags)
                     self._dirty = True
                 def __setitem__(self, f, n):
                     """Store node ``n`` for path ``f`` and mark the tree dirty.

                     A missing subdirectory on the way to ``f`` is created. Flags are
                     left untouched.
                     """
                     assert n is not None
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         # manifest nodes are either 20 bytes or 32 bytes,
                         # depending on the hash in use. Assert this as historically
                         # sometimes extra bytes were added.
                         assert len(n) in (20, 32)
                         self._files[f] = n
                     else:
                         self._loadlazy(topdir)
                         if topdir not in self._dirs:
                             self._dirs[topdir] = treemanifest(
                                 self.nodeconstants, self._subpath(topdir)
                             )
                         self._dirs[topdir].__setitem__(rest, n)
                     self._dirty = True
                 def _load(self):
                     """Run the pending deferred load, or else the pending deferred copy.

                     At most one of the two runs per call. The slot is reset to
                     ``_noop`` before the function is invoked, so it runs only once.
                     """
                     pending = self._loadfunc
                     if pending is not _noop:
                         self._loadfunc = _noop
                         pending(self)
                         return
                     pending = self._copyfunc
                     if pending is not _noop:
                         self._copyfunc = _noop
                         pending(self)
                 def setflag(self, f, flags):
                     """Set the flags (symlink, executable) for path f.

                     A missing subdirectory on the way to ``f`` is created. The tree
                     is marked dirty. Raises TypeError when ``flags`` is not one of
                     ``_manifestflags``.
                     """
                     if flags not in _manifestflags:
                         raise TypeError(b"Invalid manifest flag set.")
                     self._load()
                     topdir, rest = _splittopdir(f)
                     if not topdir:
                         self._flags[f] = flags
                     else:
                         self._loadlazy(topdir)
                         if topdir not in self._dirs:
                             self._dirs[topdir] = treemanifest(
                                 self.nodeconstants, self._subpath(topdir)
                             )
                         self._dirs[topdir].setflag(rest, flags)
                     self._dirty = True
                 def copy(self):
                     """Return a copy of this tree with the same node and dirty flag.

                     The contents are copied right away when this tree has no pending
                     load or copy. Otherwise the new tree gets a deferred copy function
                     that runs on its first ``_load()``: this tree's own pending copy
                     function when it has one, else one that loads this tree first.
                     """
                     clone = treemanifest(self.nodeconstants, self._dir)
                     clone._node = self._node
                     clone._dirty = self._dirty
                     if self._copyfunc is not _noop:
                         # we are an unresolved copy ourselves: hand the same job on
                         clone._copyfunc = self._copyfunc
                         return clone

                     def _copyfunc(s):
                         self._load()
                         # lazy entries are shared but flagged "copy when loaded"
                         s._lazydirs = {
                             d: (n, r, True) for d, (n, r, c) in self._lazydirs.items()
                         }
                         for d, v in self._dirs.items():
                             s._dirs[d] = v.copy()
                         s._files = dict.copy(self._files)
                         s._flags = dict.copy(self._flags)

                     if self._loadfunc is _noop:
                         _copyfunc(clone)
                     else:
                         clone._copyfunc = _copyfunc
                     return clone
                 def filesnotin(self, m2, match=None):
                     '''Set of files in this manifest that are not in the other'''
                     if match and not match.always():
                         m1 = self._matches(match)
                         m2 = m2._matches(match)
                         return m1.filesnotin(m2)
                     files = set()
                     def _filesnotin(t1, t2):
                         if t1._node == t2._node and not t1._dirty and not t2._dirty:
                             return
                         t1._load()
                         t2._load()
                         self._loaddifflazy(t1, t2)
                         for d, m1 in t1._dirs.items():
                             if d in t2._dirs:
                                 m2 = t2._dirs[d]
                                 _filesnotin(m1, m2)
                             else:
                                 files.update(m1.iterkeys())
                         for fn in t1._files:
                             if fn not in t2._files:
                                 files.add(t1._subpath(fn))
                     _filesnotin(self, m2)
                     return files
                 @propertycache
                 def _alldirs(self):
                     """Result of ``pathutil.dirs`` applied to this manifest."""
                     alldirs = pathutil.dirs(self)
                     return alldirs
                 def dirs(self):
                     return self._alldirs
                 def hasdir(self, dir):
                     """Tell whether directory ``dir`` (no trailing slash) is in this tree.

                     A nested path is resolved one level at a time, loading a lazy
                     subdirectory on the way. The last component only has to be
                     known, loaded or lazy.
                     """
                     self._load()
                     topdir, subdir = _splittopdir(dir)
                     if not topdir:
                         dirslash = dir + b'/'
                         return dirslash in self._dirs or dirslash in self._lazydirs
                     self._loadlazy(topdir)
                     if topdir in self._dirs:
                         return self._dirs[topdir].hasdir(subdir)
                     return False
                 def walk(self, match):
                     """Generates matching file names.
                     It also reports nonexistent files by marking them bad with match.bad().
                     """
                     if match.always():
                         for f in iter(self):
                             yield f
                         return
                     fset = set(match.files())
                     for fn in self._walk(match):
                         if fn in fset:
                             # specified pattern is the exact name
                             fset.remove(fn)
                         yield fn
                     # for dirstate.walk, files=[''] means "walk the whole tree".
                     # follow that here, too
                     fset.discard(b'')
                     for fn in sorted(fset):
                         if not self.hasdir(fn):
                             match.bad(fn, None)
                 def _walk(self, match):
                     '''Recursively generates matching file names for walk().'''
                     visit = match.visitchildrenset(self._dir[:-1])
                     if not visit:
                         return
                     # yield this dir's files and walk its submanifests
                     self._load()
                     visit = self._loadchildrensetlazy(visit)
                     for p in sorted(list(self._dirs) + list(self._files)):
                         if p in self._files:
                             fullp = self._subpath(p)
                             if match(fullp):
                                 yield fullp
                         else:
                             if not visit or p[:-1] in visit:
                                 for f in self._dirs[p]._walk(match):
                                     yield f
                 def _matches(self, match):
                     """recursively generate a new manifest filtered by the match argument."""
                     if match.always():
                         return self.copy()
                     return self._matches_inner(match)
                 def _matches_inner(self, match):
                     if match.always():
                         return self.copy()
                     visit = match.visitchildrenset(self._dir[:-1])
                     if visit == b'all':
                         return self.copy()
                     ret = treemanifest(self.nodeconstants, self._dir)
                     if not visit:
                         return ret
                     self._load()
                     for fn in self._files:
                         # While visitchildrenset *usually* lists only subdirs, this is
                         # actually up to the matcher and may have some files in the set().
                         # If visit == 'this', we should obviously look at the files in this
                         # directory; if visit is a set, and fn is in it, we should inspect
                         # fn (but no need to inspect things not in the set).
                         if visit != b'this' and fn not in visit:
                             continue
                         fullp = self._subpath(fn)
                         # visitchildrenset isn't perfect, we still need to call the regular
                         # matcher code to further filter results.
                         if not match(fullp):
                             continue
                         ret._files[fn] = self._files[fn]
                         if fn in self._flags:
                             ret._flags[fn] = self._flags[fn]
                     visit = self._loadchildrensetlazy(visit)
                     for dir, subm in self._dirs.items():
                         if visit and dir[:-1] not in visit:
                             continue
                         m = subm._matches_inner(match)
                         if not m._isempty():
                             ret._dirs[dir] = m
                     if not ret._isempty():
                         ret._dirty = True
                     return ret
                 def fastdelta(self, base, changes):
                     """Always raise FastdeltaUnavailable; both arguments are ignored."""
                     raise FastdeltaUnavailable()
                 def diff(self, m2, match=None, clean=False):
                     """Finds changes between the current manifest and m2.
                     Args:
                       m2: the manifest to which this manifest should be compared.
                       clean: if true, include files unchanged between these manifests
                              with a None value in the returned dictionary.
                     The result is returned as a dict with filename as key and
                     values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
                     nodeid in the current/other manifest and fl1/fl2 is the flag
                     in the current/other manifest. Where the file does not exist,
                     the nodeid will be None and the flags will be the empty
                     string.
                     """
                     if match and not match.always():
                         m1 = self._matches(match)
                         m2 = m2._matches(match)
                         return m1.diff(m2, clean=clean)
                     result = {}
                     emptytree = treemanifest(self.nodeconstants)
                     def _iterativediff(t1, t2, stack):
                         """compares two tree manifests and append new tree-manifests which
                         needs to be compared to stack"""
                         if t1._node == t2._node and not t1._dirty and not t2._dirty:
                             return
                         t1._load()
                         t2._load()
                         self._loaddifflazy(t1, t2)
                         for d, m1 in t1._dirs.items():
                             m2 = t2._dirs.get(d, emptytree)
                             stack.append((m1, m2))
                         for d, m2 in t2._dirs.items():
                             if d not in t1._dirs:
                                 stack.append((emptytree, m2))
                         for fn, n1 in t1._files.items():
                             fl1 = t1._flags.get(fn, b'')
                             n2 = t2._files.get(fn, None)
                             fl2 = t2._flags.get(fn, b'')
                             if n1 != n2 or fl1 != fl2:
                                 result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
                             elif clean:
                                 result[t1._subpath(fn)] = None
                         for fn, n2 in t2._files.items():
                             if fn not in t1._files:
                                 fl2 = t2._flags.get(fn, b'')
                                 result[t2._subpath(fn)] = ((None, b''), (n2, fl2))
                     stackls = []
                     _iterativediff(self, m2, stackls)
                     while stackls:
                         t1, t2 = stackls.pop()
                         # stackls is populated in the function call
                         _iterativediff(t1, t2, stackls)
                     return result
                 def unmodifiedsince(self, m2):
                     return not self._dirty and not m2._dirty and self._node == m2._node
                 def parse(self, text, readsubtree):
                     """Fill this tree from the manifest ``text``.

                     Entries flagged ``b't'`` become lazy subdirectories that will be
                     read through ``readsubtree`` on demand. Entries with a ``/`` in
                     their name are inserted through the item/flag setters; all other
                     entries are stored directly.
                     """
                     lazydirs = self._lazydirs
                     for f, n, fl in _parse(self._nodelen, text):
                         if fl == b't':
                             # False below means "doesn't need to be copied" and can use the
                             # cached value from readsubtree directly.
                             lazydirs[f + b'/'] = (n, readsubtree, False)
                             continue
                         if b'/' not in f:
                             # Assigning to _files and _flags avoids marking as dirty,
                             # and should be a little faster.
                             self._files[f] = n
                             if fl:
                                 self._flags[f] = fl
                             continue
                         # This is a flat manifest, so use __setitem__ and setflag rather
                         # than assigning directly to _files and _flags, so we can
                         # assign a path in a subdirectory, and to mark dirty (compared
                         # to nullid).
                         self[f] = n
                         if fl:
                             self.setflag(f, fl)
                 def text(self):
                     """Get the full data of this manifest as a bytestring.

                     The text is built by ``_text`` from ``iterentries()``.
                     """
                     self._load()
                     entries = self.iterentries()
                     return _text(entries)
                 def dirtext(self):
                     """Get the full data of this directory as a bytestring.

                     Only this level is serialised: files with their node and flags,
                     and subdirectories (loaded or lazy) with their node and the
                     ``b't'`` flag. Make sure that any submanifests have been written
                     first, so their nodeids are correct.
                     """
                     self._load()
                     flagof = self.flags
                     entries = [(d[:-1], self._dirs[d]._node, b't') for d in self._dirs]
                     entries += [(f, self._files[f], flagof(f)) for f in self._files]
                     # lazy subdirectories carry their node in the first slot
                     entries += [(d[:-1], v[0], b't') for d, v in self._lazydirs.items()]
                     return _text(sorted(entries))
                 def read(self, gettext, readsubtree):
                     def _load_for_read(s):
                         s.parse(gettext(), readsubtree)
                         s._dirty = False
                     self._loadfunc = _load_for_read
                 def writesubtrees(self, m1, m2, writesubtree, match):
                     """Call ``writesubtree`` for every subdirectory selected by ``match``.

                     Each call receives the subtree, the nodes that ``m1`` and ``m2``
                     record for the same directory, and ``match``. The two nodes are
                     swapped when the one from ``m1`` is nullid.
                     """
                     self._load()  # for consistency; should never have any effect here
                     m1._load()
                     m2._load()
                     emptytree = treemanifest(self.nodeconstants)
                     nullid = self.nodeconstants.nullid

                     def getnode(m, d):
                         # a lazy entry already carries the node; do not load it
                         lazy = m._lazydirs.get(d)
                         if lazy:
                             return lazy[0]
                         return m._dirs.get(d, emptytree)._node

                     # let's skip investigating things that `match` says we do not need.
                     visit = match.visitchildrenset(self._dir[:-1])
                     visit = self._loadchildrensetlazy(visit)
                     if visit == b'this' or visit == b'all':
                         visit = None
                     for d, subm in self._dirs.items():
                         if visit and d[:-1] not in visit:
                             continue
                         subp1, subp2 = getnode(m1, d), getnode(m2, d)
                         if subp1 == nullid:
                             subp1, subp2 = subp2, subp1
                         writesubtree(subm, subp1, subp2, match)
                 def walksubtrees(self, matcher=None):
                     """Returns an iterator of the subtrees of this manifest, including this
                     manifest itself.
                     If `matcher` is provided, it only returns subtrees that match.
                     """
                     if matcher and not matcher.visitdir(self._dir[:-1]):
                         return
                     if not matcher or matcher(self._dir[:-1]):
                         yield self
                     self._load()
                     # OPT: use visitchildrenset to avoid loading everything.
                     self._loadalllazy()
                     for d, subm in self._dirs.items():
                         for subtree in subm.walksubtrees(matcher=matcher):
                             yield subtree
             class manifestfulltextcache(util.lrucachedict):
                 """File-backed LRU cache for the manifest cache
                 File consists of entries, up to EOF:
                 - 20 bytes node, 4 bytes length, <length> manifest data
                 These are written in reverse cache order (oldest to newest).
                 """
                 _file = b'manifestfulltextcache'
                 def __init__(self, max):
                     """Create the cache with capacity ``max``.

                     It starts clean, not yet read from disk and without an opener.
                     """
                     super(manifestfulltextcache, self).__init__(max)
                     self._dirty = self._read = False
                     self._opener = None
                 def read(self):
                     """Fill the cache from its backing file.

                     Does nothing when the file was already read or when no opener is
                     set. Entries are read as a 20-byte node, a 4-byte big-endian
                     length and that many bytes of data; reading stops at the first
                     incomplete entry. An IOError is ignored. Afterwards the cache is
                     flagged as read and not dirty.
                     """
                     if self._read or self._opener is None:
                         return

                     try:
                         with self._opener(self._file) as fp:
                             # entries are stored through the parent class's __setitem__
                             store = super(manifestfulltextcache, self).__setitem__
                             # ignore trailing data, this is a cache, corruption is skipped
                             while True:
                                 # TODO do we need to do work here for sha1 portability?
                                 node = fp.read(20)
                                 if len(node) < 20:
                                     break
                                 try:
                                     (size,) = struct.unpack(b'>L', fp.read(4))
                                 except struct.error:
                                     break
                                 value = bytearray(fp.read(size))
                                 if len(value) != size:
                                     break
                                 store(node, value)
                     except IOError:
                         # the file is allowed to be missing
                         pass

                     self._read = True
                     self._dirty = False
                 def write(self):
                     if not self._dirty or self._opener is None:
                         return
                     # rotate backwards to the first used node
                     try:
                         with self._opener(
                             self._file, b'w', atomictemp=True, checkambig=True
                         ) as fp:
                             node = self._head.prev
                             while True:
                                 if node.key in self._cache:
                                     fp.write(node.key)
                                     fp.write(struct.pack(b'>L', len(node.value)))
                                     fp.write(node.value)
                                 if node is self._head:
                                     break
                                 node = node.prev
                     except IOError:
                         # We could not write the cache (eg: permission error)
                         # the content can be missing.
                         #
                         # We could try harder and see if we could recreate a wcache
                         # directory were we coudl write too.
                         #
                         # XXX the error pass silently, having some way to issue an error
                         # log `ui.log` would be nice.
                         pass
                 def __len__(self):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).__len__()
                 def __contains__(self, k):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).__contains__(k)
                 def __iter__(self):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).__iter__()
                 def __getitem__(self, k):
                     if not self._read:
                         self.read()
                     # the cache lru order can change on read
                     setdirty = self._cache.get(k) is not self._head
                     value = super(manifestfulltextcache, self).__getitem__(k)
                     if setdirty:
                         self._dirty = True
                     return value
                 def __setitem__(self, k, v):
                     if not self._read:
                         self.read()
                     super(manifestfulltextcache, self).__setitem__(k, v)
                     self._dirty = True
                 def __delitem__(self, k):
                     if not self._read:
                         self.read()
                     super(manifestfulltextcache, self).__delitem__(k)
                     self._dirty = True
                 def get(self, k, default=None):
                     if not self._read:
                         self.read()
                     return super(manifestfulltextcache, self).get(k, default=default)
                 def clear(self, clear_persisted_data=False):
                     super(manifestfulltextcache, self).clear()
                     if clear_persisted_data:
                         self._dirty = True
                         self.write()
                     self._read = False
             # an upper bound of what we expect from compression
             # (real-life value seems to be "3")
             MAXCOMPRESSION = 3
             class FastdeltaUnavailable(Exception):
                 """Raised to signal that fastdelta cannot be used for a manifest."""
             @interfaceutil.implementer(repository.imanifeststorage)
             class manifestrevlog:
                 """A revlog that stores manifest texts. This is responsible for caching the
                 full-text manifest contents.
                 """

                 def __init__(
                     self,
                     nodeconstants,
                     opener,
                     tree=b'',
                     dirlogcache=None,
                     treemanifest=False,
                 ):
                     """Constructs a new manifest revlog

                     `nodeconstants` - node constants, kept on the instance and handed
                     to the sub-directory revlogs created by dirlog().

                     `opener` - opener given to the underlying revlog. Its `options`
                     mapping, when it has one, is consulted for `manifestcachesize`,
                     `treemanifest` and `persistent-nodemap`.

                     `tree` - directory this revlog is for; empty for the root
                     manifest revlog.

                     `dirlogcache` - mapping of directory to manifestrevlog kept on
                     the root manifest revlog; only used when `tree` is set.

                     `treemanifest` - used to indicate this is a tree manifest revlog. Opener
                     options can also be used to make this a tree manifest revlog. The opener
                     option takes precedence, so if it is set to True, we ignore whatever
                     value is passed in to the constructor.
                     """
                     self.nodeconstants = nodeconstants
                     # During normal operations, we expect to deal with not more than four
                     # revs at a time (such as during commit --amend). When rebasing large
                     # stacks of commits, the number can go up, hence the config knob below.
                     cachesize = 4
                     optiontreemanifest = False
                     persistentnodemap = False
                     opts = getattr(opener, 'options', None)
                     if opts is not None:
                         cachesize = opts.get(b'manifestcachesize', cachesize)
                         optiontreemanifest = opts.get(b'treemanifest', False)
                         # read through `opts` like the other options, so an opener
                         # without an `options` attribute keeps working
                         persistentnodemap = opts.get(b'persistent-nodemap', False)
                     self._treeondisk = optiontreemanifest or treemanifest
                     self._fulltextcache = manifestfulltextcache(cachesize)
                     if tree:
                         assert self._treeondisk, (tree, b'opts is %r' % opts)
                     radix = b'00manifest'
                     if tree:
                         radix = b"meta/" + tree + radix
                     self.tree = tree
                     # The dirlogcache is kept on the root manifest log
                     if tree:
                         self._dirlogcache = dirlogcache
                     else:
                         self._dirlogcache = {b'': self}
                     self._revlog = revlog.revlog(
                         opener,
                         target=(revlog_constants.KIND_MANIFESTLOG, self.tree),
                         radix=radix,
                         # only root indexfile is cached
                         checkambig=not bool(tree),
                         mmaplargeindex=True,
                         upperboundcomp=MAXCOMPRESSION,
                         persistentnodemap=persistentnodemap,
                     )
                     self.index = self._revlog.index

                 def get_revlog(self):
                     """return an actual revlog instance if any

                     This exist because a lot of code leverage the fact the underlying
                     storage is a revlog for optimization, so giving simple way to access
                     the revlog instance helps such code.
                     """
                     return self._revlog

                 def _setupmanifestcachehooks(self, repo):
                     """Persist the manifestfulltextcache on lock release"""
                     if not hasattr(repo, '_wlockref'):
                         return
                     self._fulltextcache._opener = repo.wcachevfs
                     if repo._currentlock(repo._wlockref) is None:
                         return
                     # only weak references are captured by the callback below, so
                     # registering it keeps neither the repo nor this revlog alive
                     reporef = weakref.ref(repo)
                     manifestrevlogref = weakref.ref(self)

                     def persistmanifestcache(success):
                         # Repo is in an unknown state, do not persist.
                         if not success:
                             return
                         repo = reporef()
                         self = manifestrevlogref()
                         if repo is None or self is None:
                             return
                         if repo.manifestlog.getstorage(b'') is not self:
                             # there's a different manifest in play now, abort
                             return
                         self._fulltextcache.write()

                     repo._afterlock(persistmanifestcache)

                 @property
                 def fulltextcache(self):
                     return self._fulltextcache

                 def clearcaches(self, clear_persisted_data=False):
                     """Drop the revlog, full-text and directory revlog caches."""
                     self._revlog.clearcaches()
                     self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)
                     self._dirlogcache = {self.tree: self}

                 def dirlog(self, d):
                     """Return the manifestrevlog for directory `d`, creating and
                     caching it on first use."""
                     if d:
                         assert self._treeondisk
                     if d not in self._dirlogcache:
                         mfrevlog = manifestrevlog(
                             self.nodeconstants,
                             self.opener,
                             d,
                             self._dirlogcache,
                             treemanifest=self._treeondisk,
                         )
                         self._dirlogcache[d] = mfrevlog
                     return self._dirlogcache[d]

                 def add(
                     self,
                     m,
                     transaction,
                     link,
                     p1,
                     p2,
                     added,
                     removed,
                     readtree=None,
                     match=None,
                 ):
                     """add some manifest entry in to the manifest log

                     input:

                       m:           the manifest dict we want to store
                       transaction: the open transaction
                       link:        the link value handed to the revlog for the new
                                    revision
                       p1:          manifest-node of p1
                       p2:          manifest-node of p2
                       added:       file added/changed compared to parent
                       removed:     file removed compared to parent

                     tree manifest input:

                       readtree:    a function to read a subtree
                       match:       a filematcher for the subpart of the tree manifest

                     Returns the node of the stored manifest.
                     """
                     try:
                         if p1 not in self.fulltextcache:
                             raise FastdeltaUnavailable()
                         # If our first parent is in the manifest cache, we can
                         # compute a delta here using properties we know about the
                         # manifest up-front, which may save time later for the
                         # revlog layer.
                         _checkforbidden(added)
                         # combine the changed lists into one sorted iterator
                         work = heapq.merge(
                             [(x, False) for x in sorted(added)],
                             [(x, True) for x in sorted(removed)],
                         )
                         arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
                         cachedelta = self._revlog.rev(p1), deltatext
                         text = util.buffer(arraytext)
                         rev = self._revlog.addrevision(
                             text, transaction, link, p1, p2, cachedelta
                         )
                         n = self._revlog.node(rev)
                     except FastdeltaUnavailable:
                         # The first parent manifest isn't already loaded or the
                         # manifest implementation doesn't support fastdelta, so
                         # we'll just encode a fulltext of the manifest and pass
                         # that through to the revlog layer, and let it handle the
                         # delta process.
                         if self._treeondisk:
                             assert readtree, b"readtree must be set for treemanifest writes"
                             assert match, b"match must be specified for treemanifest writes"
                             m1 = readtree(self.tree, p1)
                             m2 = readtree(self.tree, p2)
                             n = self._addtree(
                                 m, transaction, link, m1, m2, readtree, match=match
                             )
                             # no full text is produced on this path, so there is
                             # nothing to put in the full-text cache
                             arraytext = None
                         else:
                             text = m.text()
                             rev = self._revlog.addrevision(text, transaction, link, p1, p2)
                             n = self._revlog.node(rev)
                             arraytext = bytearray(text)
                     if arraytext is not None:
                         self.fulltextcache[n] = arraytext
                     return n

                 def _addtree(self, m, transaction, link, m1, m2, readtree, match):
                     """Write tree manifest `m` and its subtrees; return its node.

                     `m1` and `m2` are the parent manifests as returned by `readtree`.
                     """
                     # If the manifest is unchanged compared to one parent,
                     # don't write a new revision
                     if self.tree != b'' and (
                         m.unmodifiedsince(m1) or m.unmodifiedsince(m2)
                     ):
                         return m.node()

                     def writesubtree(subm, subp1, subp2, match):
                         sublog = self.dirlog(subm.dir())
                         sublog.add(
                             subm,
                             transaction,
                             link,
                             subp1,
                             subp2,
                             None,
                             None,
                             readtree=readtree,
                             match=match,
                         )

                     m.writesubtrees(m1, m2, writesubtree, match)
                     text = m.dirtext()
                     n = None
                     if self.tree != b'':
                         # Double-check whether contents are unchanged to one parent
                         if text == m1.dirtext():
                             n = m1.node()
                         elif text == m2.dirtext():
                             n = m2.node()
                     if not n:
                         rev = self._revlog.addrevision(
                             text, transaction, link, m1.node(), m2.node()
                         )
                         n = self._revlog.node(rev)
                     # Save nodeid so parent manifest can calculate its nodeid
                     m.setnode(n)
                     return n

                 # The methods below forward their arguments unchanged to the
                 # underlying revlog.

                 def __len__(self):
                     return len(self._revlog)

                 def __iter__(self):
                     return self._revlog.__iter__()

                 def rev(self, node):
                     return self._revlog.rev(node)

                 def node(self, rev):
                     return self._revlog.node(rev)

                 def lookup(self, value):
                     return self._revlog.lookup(value)

                 def parentrevs(self, rev):
                     return self._revlog.parentrevs(rev)

                 def parents(self, node):
                     return self._revlog.parents(node)

                 def linkrev(self, rev):
                     return self._revlog.linkrev(rev)

                 def checksize(self):
                     return self._revlog.checksize()

                 def revision(self, node):
                     return self._revlog.revision(node)

                 def rawdata(self, node):
                     return self._revlog.rawdata(node)

                 def revdiff(self, rev1, rev2):
                     return self._revlog.revdiff(rev1, rev2)

                 def cmp(self, node, text):
                     return self._revlog.cmp(node, text)

                 def deltaparent(self, rev):
                     return self._revlog.deltaparent(rev)

                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                     sidedata_helpers=None,
                     debug_info=None,
                 ):
                     return self._revlog.emitrevisions(
                         nodes,
                         nodesorder=nodesorder,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         deltamode=deltamode,
                         sidedata_helpers=sidedata_helpers,
                         debug_info=debug_info,
                     )

                 def addgroup(
                     self,
                     deltas,
                     linkmapper,
                     transaction,
                     alwayscache=False,
                     addrevisioncb=None,
                     duplicaterevisioncb=None,
                     debug_info=None,
                     delta_base_reuse_policy=None,
                 ):
                     return self._revlog.addgroup(
                         deltas,
                         linkmapper,
                         transaction,
                         alwayscache=alwayscache,
                         addrevisioncb=addrevisioncb,
                         duplicaterevisioncb=duplicaterevisioncb,
                         debug_info=debug_info,
                         delta_base_reuse_policy=delta_base_reuse_policy,
                     )

                 def rawsize(self, rev):
                     return self._revlog.rawsize(rev)

                 def getstrippoint(self, minlink):
                     return self._revlog.getstrippoint(minlink)

                 def strip(self, minlink, transaction):
                     return self._revlog.strip(minlink, transaction)

                 def files(self):
                     return self._revlog.files()

                 def clone(self, tr, destrevlog, **kwargs):
                     """Clone the underlying revlog into the one wrapped by
                     `destrevlog`, which must be a manifestrevlog."""
                     if not isinstance(destrevlog, manifestrevlog):
                         raise error.ProgrammingError(b'expected manifestrevlog to clone()')
                     return self._revlog.clone(tr, destrevlog._revlog, **kwargs)

                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     return self._revlog.storageinfo(
                         exclusivefiles=exclusivefiles,
                         sharedfiles=sharedfiles,
                         revisionscount=revisionscount,
                         trackedsize=trackedsize,
                         storedsize=storedsize,
                     )

                 @property
                 def opener(self):
                     return self._revlog.opener

                 @opener.setter
                 def opener(self, value):
                     self._revlog.opener = value
             @interfaceutil.implementer(repository.imanifestlog)
             class manifestlog:
                 """Collection of the manifest snapshots referenced by the commits of a
                 repository.

                 Here a 'manifest' is the abstract notion of a snapshot of the list of
                 files in a given commit. Consumers of this class are not expected to
                 care how the manifests they receive are implemented (tree, flat,
                 lazily loaded, etc).
                 """

                 def __init__(self, opener, repo, rootstore, narrowmatch):
                     self.nodeconstants = repo.nodeconstants
                     options = getattr(opener, 'options', None)
                     if options is None:
                         usetreemanifest = False
                         cachesize = 4
                     else:
                         usetreemanifest = options.get(b'treemanifest', False)
                         cachesize = options.get(b'manifestcachesize', 4)
                     self._treemanifests = usetreemanifest
                     self._cachesize = cachesize
                     self._narrowmatch = narrowmatch
                     self._rootstore = rootstore
                     self._rootstore._setupmanifestcachehooks(repo)
                     # A cache of the manifestctx or treemanifestctx for each directory
                     self._dirmancache = {b'': util.lrucachedict(cachesize)}

                 def __getitem__(self, node):
                     """Return the root manifest instance for `node`.

                     Same as `get(b'', node)`.
                     """
                     return self.get(b'', node)

                 def get(self, tree, node, verify=True):
                     """Return the manifest instance for `node` in directory `tree`.

                     `verify` - when True, the node is looked up in the storage first,
                                which raises a LookupError if it does not exist.

                     Instances are cached per directory, except for the null node.
                     """
                     cached = self._dirmancache.get(tree, ())
                     if node in cached:
                         return cached[node]

                     narrowmatch = self._narrowmatch
                     if not narrowmatch.always() and not narrowmatch.visitdir(tree[:-1]):
                         return excludeddirmanifestctx(self.nodeconstants, tree, node)

                     if not tree:
                         if verify:
                             # Side-effect is LookupError is raised if node doesn't exist.
                             self._rootstore.rev(node)
                         if self._treemanifests:
                             m = treemanifestctx(self, b'', node)
                         else:
                             m = manifestctx(self, node)
                     elif not self._rootstore._treeondisk:
                         raise error.Abort(
                             _(
                                 b"cannot ask for manifest directory '%s' in a flat "
                                 b"manifest"
                             )
                             % tree
                         )
                     else:
                         if verify:
                             # Side-effect is LookupError is raised if node doesn't
                             # exist.
                             self.getstorage(tree).rev(node)
                         m = treemanifestctx(self, tree, node)

                     if node == self.nodeconstants.nullid:
                         return m
                     mancache = self._dirmancache.get(tree)
                     if not mancache:
                         mancache = util.lrucachedict(self._cachesize)
                         self._dirmancache[tree] = mancache
                     mancache[node] = m
                     return m

                 def getstorage(self, tree):
                     """Return the storage of directory `tree`, from the root store."""
                     return self._rootstore.dirlog(tree)

                 def clearcaches(self, clear_persisted_data=False):
                     """Forget the cached manifest instances and clear the root store
                     caches."""
                     self._dirmancache.clear()
                     self._rootstore.clearcaches(clear_persisted_data=clear_persisted_data)

                 def rev(self, node):
                     return self._rootstore.rev(node)

                 def update_caches(self, transaction):
                     root_revlog = self._rootstore._revlog
                     return root_revlog.update_caches(transaction=transaction)
             @interfaceutil.implementer(repository.imanifestrevisionwritable)
             class memmanifestctx:
                 """An in-memory flat manifest that can be written to the manifest log."""

                 def __init__(self, manifestlog):
                     self._manifestlog = manifestlog
                     nodelen = manifestlog.nodeconstants.nodelen
                     self._manifestdict = manifestdict(nodelen)

                 def _storage(self):
                     # flat manifests only ever use the root storage
                     rootdir = b''
                     return self._manifestlog.getstorage(rootdir)

                 def copy(self):
                     """Return a new memmanifestctx holding a copy of the content."""
                     duplicate = memmanifestctx(self._manifestlog)
                     duplicate._manifestdict = self.read().copy()
                     return duplicate

                 def read(self):
                     return self._manifestdict

                 def write(self, transaction, link, p1, p2, added, removed, match=None):
                     """Add the in-memory manifest to the storage and return what the
                     storage's add() returns."""
                     store = self._storage()
                     return store.add(
                         self._manifestdict,
                         transaction,
                         link,
                         p1,
                         p2,
                         added,
                         removed,
                         match=match,
                     )
             @interfaceutil.implementer(repository.imanifestrevisionstored)
             class manifestctx:
                 """One stored revision of a flat manifest, identified by its node.

                 The content is only read from the storage when read() (or one of its
                 variants) is called.
                 """

                 def __init__(self, manifestlog, node):
                     self._node = node
                     self._manifestlog = manifestlog
                     # filled in by read()
                     self._data = None
                     # TODO: We eventually want p1, p2, and linkrev exposed on this class,
                     # but let's add it later when something needs it and we can load it
                     # lazily.
                     # self.p1, self.p2 = store.parents(node)
                     # rev = store.rev(node)
                     # self.linkrev = store.linkrev(rev)

                 def _storage(self):
                     # flat manifests only ever use the root storage
                     rootdir = b''
                     return self._manifestlog.getstorage(rootdir)

                 def node(self):
                     return self._node

                 def copy(self):
                     """Return a memmanifestctx holding a copy of this manifest."""
                     duplicate = memmanifestctx(self._manifestlog)
                     duplicate._manifestdict = self.read().copy()
                     return duplicate

                 @propertycache
                 def parents(self):
                     store = self._storage()
                     return store.parents(self._node)

                 def read(self):
                     """Return the manifestdict of this revision, loading it on first use.

                     The full text comes from the storage's full-text cache when it is
                     there; otherwise it is read from the storage and put in that cache.
                     """
                     if self._data is not None:
                         return self._data
                     nc = self._manifestlog.nodeconstants
                     if self._node == nc.nullid:
                         self._data = manifestdict(nc.nodelen)
                         return self._data
                     store = self._storage()
                     cache = store.fulltextcache
                     if self._node in cache:
                         text = pycompat.bytestr(cache[self._node])
                     else:
                         text = store.revision(self._node)
                         cache[self._node] = bytearray(text)
                     self._data = manifestdict(nc.nodelen, text)
                     return self._data

                 def readfast(self, shallow=False):
                     """Call readdelta() when the stored delta is against one of the
                     parents of this revision, and read() otherwise.

                     `shallow` is not used: this is a flat manifest.
                     """
                     store = self._storage()
                     rev = store.rev(self._node)
                     base = store.deltaparent(rev)
                     if base == nullrev or base not in store.parentrevs(rev):
                         return self.read()
                     return self.readdelta()

                 def readdelta(self, shallow=False):
                     """Return a manifest built from the diff between the delta parent
                     of this revision and the revision itself.

                     `shallow` is not used: this is a flat manifest.
                     """
                     store = self._storage()
                     rev = store.rev(self._node)
                     base = store.deltaparent(rev)
                     patch = store.revdiff(base, rev)
                     text = mdiff.patchtext(patch)
                     return manifestdict(store.nodeconstants.nodelen, text)

                 def find(self, key):
                     manifest = self.read()
                     return manifest.find(key)
             @interfaceutil.implementer(repository.imanifestrevisionwritable)
             class memtreemanifestctx:
                 """An in-memory tree manifest that can be written to the manifest log."""

                 def __init__(self, manifestlog, dir=b''):
                     self._dir = dir
                     self._manifestlog = manifestlog
                     self._treemanifest = treemanifest(manifestlog.nodeconstants)

                 def _storage(self):
                     rootdir = b''
                     return self._manifestlog.getstorage(rootdir)

                 def copy(self):
                     """Return a new memtreemanifestctx holding a copy of the content."""
                     duplicate = memtreemanifestctx(self._manifestlog, dir=self._dir)
                     duplicate._treemanifest = self._treemanifest.copy()
                     return duplicate

                 def read(self):
                     return self._treemanifest

                 def write(self, transaction, link, p1, p2, added, removed, match=None):
                     """Add the in-memory tree manifest to the storage.

                     The storage is given a `readtree` callback that reads a
                     directory manifest through the manifest log.
                     """
                     manifestlog = self._manifestlog

                     def readtree(dir, node):
                         ctx = manifestlog.get(dir, node)
                         return ctx.read()

                     store = self._storage()
                     return store.add(
                         self._treemanifest,
                         transaction,
                         link,
                         p1,
                         p2,
                         added,
                         removed,
                         readtree=readtree,
                         match=match,
                     )
             @interfaceutil.implementer(repository.imanifestrevisionstored)
             class treemanifestctx:
                 """Context for one stored revision of a directory's manifest.

                 An instance is identified by a directory and a node. The parsed
                 manifest is produced on demand by ``read()`` and then kept in
                 ``self._data``.
                 """

                 def __init__(self, manifestlog, dir, node):
                     self._manifestlog = manifestlog
                     self._dir = dir
                     self._node = node
                     # Filled in by the first call to read().
                     self._data = None

                     # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded
                     # so that we can instantiate treemanifestctx objects for
                     # directories we don't have on disk.
                     # self.p1, self.p2 = store.parents(node)
                     # rev = store.rev(node)
                     # self.linkrev = store.linkrev(rev)

                 def _storage(self):
                     """Return the storage object backing this directory.

                     If the manifestlog's narrow matcher does not match everything
                     and does not visit this directory, an
                     ``excludedmanifestrevlog`` is returned in place of the
                     manifestlog's own storage.
                     """
                     matcher = self._manifestlog._narrowmatch
                     # self._dir[:-1] drops the last byte of the directory name
                     # (presumably its trailing slash) before querying the matcher.
                     outside = not matcher.always() and not matcher.visitdir(
                         self._dir[:-1]
                     )
                     if outside:
                         return excludedmanifestrevlog(
                             self._manifestlog.nodeconstants, self._dir
                         )
                     return self._manifestlog.getstorage(self._dir)

                 def read(self):
                     """Return the manifest for this revision, building it at most once.

                     Three cases are handled:

                     * the node is the null id: a treemanifest constructed from the
                       node constants alone;
                     * the store keeps trees on disk: a treemanifest that is read
                       through callbacks fetching this revision's text and the
                       sub-directory manifests;
                     * otherwise: a treemanifest built from the full text, which
                       is taken from (or added to) the store's ``fulltextcache``.
                     """
                     if self._data is not None:
                         return self._data

                     store = self._storage()
                     constants = self._manifestlog.nodeconstants
                     if self._node == constants.nullid:
                         manifest = treemanifest(constants)
                     # TODO accessing non-public API
                     elif store._treeondisk:
                         manifest = treemanifest(constants, dir=self._dir)

                         def _fulltext():
                             return store.revision(self._node)

                         def _subtree(dir, subm):
                             # verify=False because we need to be able to create
                             # subtrees for trees that don't exist on disk.
                             subctx = self._manifestlog.get(dir, subm, verify=False)
                             return subctx.read()

                         manifest.read(_fulltext, _subtree)
                         manifest.setnode(self._node)
                     else:
                         if self._node not in store.fulltextcache:
                             text = store.revision(self._node)
                             # The cache stores the text as a bytearray.
                             store.fulltextcache[self._node] = bytearray(text)
                         else:
                             text = pycompat.bytestr(store.fulltextcache[self._node])
                         manifest = treemanifest(constants, dir=self._dir, text=text)

                     self._data = manifest
                     return manifest

                 def node(self):
                     """Return the node this context was created for."""
                     return self._node

                 def copy(self):
                     """Return a ``memtreemanifestctx`` for the same directory that
                     holds a copy of this revision's manifest.
                     """
                     duplicate = memtreemanifestctx(self._manifestlog, dir=self._dir)
                     duplicate._treemanifest = self.read().copy()
                     return duplicate

                 @propertycache
                 def parents(self):
                     """Parents of this node, as reported by the backing storage."""
                     storage = self._storage()
                     return storage.parents(self._node)

                 def readdelta(self, shallow=False):
                     """Return a manifest holding only the entries of this revision
                     that differ from the revision it is stored as a delta against.

                     The comparison base is ``store.deltaparent()`` of this
                     revision.

                     If `shallow` is True, only the delta for this directory is
                     read, without recursively reading subdirectory manifests, and
                     the result is a ``manifestdict``. Any subdirectory entry is
                     then reported as it appears in the manifest, i.e. among the
                     files and distinguished only by its 't' flag.

                     Otherwise both full manifests are read and diffed, and a
                     ``treemanifest`` is returned.
                     """
                     store = self._storage()
                     rev = store.rev(self._node)
                     base = store.deltaparent(rev)

                     if shallow:
                         text = mdiff.patchtext(store.revdiff(base, rev))
                         return manifestdict(store.nodeconstants.nodelen, text)

                     # Need to perform a slow delta
                     basectx = self._manifestlog.get(self._dir, store.node(base))
                     old = basectx.read()
                     new = self.read()
                     delta = treemanifest(self._manifestlog.nodeconstants, dir=self._dir)
                     changes = old.diff(new)
                     for path, ((_oldnode, _oldflag), (newnode, newflag)) in changes.items():
                         # Entries without a new node are left out of the result.
                         if not newnode:
                             continue
                         delta[path] = newnode
                         if newflag:
                             delta.setflag(path, newflag)
                     return delta

                 def readfast(self, shallow=False):
                     """Call either readdelta or a full read, whichever is less work.

                     readdelta is used when the stored delta parent is not
                     ``nullrev`` and is one of the revision's parents, since the
                     delta can then be read quickly.

                     If `shallow` is True, only the entries from this manifest are
                     returned, and not any submanifests.
                     """
                     store = self._storage()
                     rev = store.rev(self._node)
                     base = store.deltaparent(rev)
                     if base != nullrev and base in store.parentrevs(rev):
                         return self.readdelta(shallow=shallow)
                     if not shallow:
                         return self.read()
                     return manifestdict(
                         store.nodeconstants.nodelen, store.revision(self._node)
                     )

                 def find(self, key):
                     """Look up `key` in the manifest returned by read()."""
                     manifest = self.read()
                     return manifest.find(key)
             class excludeddir(treemanifest):
                 """Placeholder manifest for a directory outside the narrowspec.

                 When narrowing is active on a repository that uses treemanifests,
                 some directory revlogs are left out of the resulting clone. That
                 is a large storage win for clients, but internals still need some
                 pseudo-manifest so that a merge conflict outside the narrowspec
                 can be detected. This class fills that role: it represents a
                 directory whose node is known while its contents are not.
                 """

                 def __init__(self, nodeconstants, dir, node):
                     super().__init__(nodeconstants, dir)
                     self._node = node
                     # Register one entry under the empty name, flagged 't'.
                     # Iterators and the like will include it, so it shows up as
                     # the directory itself (i.e. something like "dir/").
                     self._files[b''] = node
                     self._flags[b''] = b't'

                 def copy(self):
                     """Return this very instance rather than a duplicate.

                     Manifests outside the narrowspec should never be modified, so
                     copying is avoided; this makes a noticeable difference when
                     very many directories lie outside the narrowspec. It also
                     keeps the "copy" of the same type as the original, which the
                     super type's copy() would not.
                     """
                     return self
             class excludeddirmanifestctx(treemanifestctx):
                 """Manifest context that yields ``excludeddir`` placeholders.

                 See the ``excludeddir`` docstring for the rationale.
                 """

                 def __init__(self, nodeconstants, dir, node):
                     # Only these three attributes are set; the parent initializer
                     # is not called here.
                     self._node = node
                     self._dir = dir
                     self.nodeconstants = nodeconstants

                 def read(self):
                     """Build a new ``excludeddir`` for this directory and node."""
                     placeholder = excludeddir(self.nodeconstants, self._dir, self._node)
                     return placeholder

                 def readfast(self, shallow=False):
                     """Return the same thing as read(); `shallow` is ignored.

                     This is a special version of readfast, since there is no
                     underlying storage here.
                     """
                     return self.read()

                 def write(self, *args):
                     """Always raise ``error.ProgrammingError`` naming the directory."""
                     message = b'attempt to write manifest from excluded dir %s' % self._dir
                     raise error.ProgrammingError(message)
             class excludedmanifestrevlog(manifestrevlog):
                 """Placeholder for treemanifest revlogs that were excluded.

                 With narrowing active on a treemanifest repository, there are
                 references to directories that cannot be seen because their
                 revlog was skipped. This class conforms to the manifestrevlog
                 interface for those directories and proactively prevents writes
                 outside the narrowspec.
                 """

                 def __init__(self, nodeconstants, dir):
                     # Only these two attributes are set; the parent initializer
                     # is not called here.
                     self._dir = dir
                     self.nodeconstants = nodeconstants

                 def __len__(self):
                     """Always raise ``error.ProgrammingError``."""
                     message = b'attempt to get length of excluded dir %s' % self._dir
                     raise error.ProgrammingError(message)

                 def rev(self, node):
                     """Always raise ``error.ProgrammingError``."""
                     message = b'attempt to get rev from excluded dir %s' % self._dir
                     raise error.ProgrammingError(message)

                 def linkrev(self, node):
                     """Always raise ``error.ProgrammingError``."""
                     message = b'attempt to get linkrev from excluded dir %s' % self._dir
                     raise error.ProgrammingError(message)

                 def node(self, rev):
                     """Always raise ``error.ProgrammingError``."""
                     message = b'attempt to get node from excluded dir %s' % self._dir
                     raise error.ProgrammingError(message)

                 def add(self, *args, **kwargs):
                     """Ignore the request: nothing is written, None is returned."""
                     # Entries should never be written to dirlogs outside the narrow
                     # clone. This method nevertheless still gets called from
                     # writesubtree() in _addtree(), so it has to be handled. That
                     # caller could possibly be changed to avoid calling add() with
                     # a clean manifest (_dirty is always False in excludeddir
                     # instances).
                     return None