corruption: backout changeset 49fd21f32695 (issue6528)...
marmoute
r48740:411dc27f 5.8.1 stable
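The hunks below back out the read-time parent reordering that changeset
49fd21f32695 introduced in parentrevs() and parents(). As a reading aid, a
minimal sketch of the difference (using the file's own index layout, where
entry[5] and entry[6] are the stored parent revisions):

    # behavior being backed out: a null p1 was swapped with p2 at read time
    if entry[5] == nullrev:
        return entry[6], entry[5]
    return entry[5], entry[6]

    # behavior after the backout: parents are returned exactly as stored
    return entry[5], entry[6]

Per the changeset title, the reordering could corrupt repositories affected
by issue6528, hence this backout.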
@@ -1,3242 +1,3236 @@
# revlog.py - storage back-end for mercurial
#
# Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""

from __future__ import absolute_import

import binascii
import collections
import contextlib
import errno
import io
import os
import struct
import zlib

# import stuff from node for others to import from revlog
from .node import (
    bin,
    hex,
    nullhex,
    nullid,
    nullrev,
    sha1nodeconstants,
    short,
    wdirfilenodeids,
    wdirhex,
    wdirid,
    wdirrev,
)
from .i18n import _
from .pycompat import getattr
from .revlogutils.constants import (
    FLAG_GENERALDELTA,
    FLAG_INLINE_DATA,
    INDEX_ENTRY_V0,
    INDEX_ENTRY_V1,
    INDEX_ENTRY_V2,
    INDEX_HEADER,
    REVLOGV0,
    REVLOGV1,
    REVLOGV1_FLAGS,
    REVLOGV2,
    REVLOGV2_FLAGS,
    REVLOG_DEFAULT_FLAGS,
    REVLOG_DEFAULT_FORMAT,
    REVLOG_DEFAULT_VERSION,
)
from .revlogutils.flagutil import (
    REVIDX_DEFAULT_FLAGS,
    REVIDX_ELLIPSIS,
    REVIDX_EXTSTORED,
    REVIDX_FLAGS_ORDER,
    REVIDX_HASCOPIESINFO,
    REVIDX_ISCENSORED,
    REVIDX_RAWTEXT_CHANGING_FLAGS,
    REVIDX_SIDEDATA,
)
from .thirdparty import attr
from . import (
    ancestor,
    dagop,
    error,
    mdiff,
    policy,
    pycompat,
    templatefilters,
    util,
)
from .interfaces import (
    repository,
    util as interfaceutil,
)
from .revlogutils import (
    deltas as deltautil,
    flagutil,
    nodemap as nodemaputil,
    sidedata as sidedatautil,
)
from .utils import (
    storageutil,
    stringutil,
)

# blanked usage of all the names to prevent pyflakes constraints
# We need these names available in the module for extensions.
REVLOGV0
REVLOGV1
REVLOGV2
FLAG_INLINE_DATA
FLAG_GENERALDELTA
REVLOG_DEFAULT_FLAGS
REVLOG_DEFAULT_FORMAT
REVLOG_DEFAULT_VERSION
REVLOGV1_FLAGS
REVLOGV2_FLAGS
REVIDX_ISCENSORED
REVIDX_ELLIPSIS
REVIDX_SIDEDATA
REVIDX_HASCOPIESINFO
REVIDX_EXTSTORED
REVIDX_DEFAULT_FLAGS
REVIDX_FLAGS_ORDER
REVIDX_RAWTEXT_CHANGING_FLAGS

parsers = policy.importmod('parsers')
rustancestor = policy.importrust('ancestor')
rustdagop = policy.importrust('dagop')
rustrevlog = policy.importrust('revlog')

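# Illustration (sketch): policy.importrust returns None when the Rust
# extension is unavailable, so callers guard on it before choosing an
# implementation, e.g.:
#
#   if rustancestor is not None:
#       lazyancestors = rustancestor.LazyAncestors
#   else:
#       lazyancestors = ancestor.lazyancestors
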
# Aliased for performance.
_zlibdecompress = zlib.decompress

# max size of revlog with inline data
_maxinline = 131072
_chunksize = 1048576

# Flag processors for REVIDX_ELLIPSIS.
def ellipsisreadprocessor(rl, text):
    return text, False


def ellipsiswriteprocessor(rl, text):
    return text, False


def ellipsisrawprocessor(rl, text):
    return False


ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)


def getoffset(q):
    return int(q >> 16)


def gettype(q):
    return int(q & 0xFFFF)


def offset_type(offset, type):
    if (type & ~flagutil.REVIDX_KNOWN_FLAGS) != 0:
        raise ValueError(b'unknown revlog index flags')
    return int(int(offset) << 16 | type)


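# Illustration (sketch): offset_type() packs a byte offset with 16 bits
# of flags into one integer; getoffset() and gettype() invert it:
#
#   packed = offset_type(1024, REVIDX_ISCENSORED)
#   assert getoffset(packed) == 1024
#   assert gettype(packed) == REVIDX_ISCENSORED
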
def _verify_revision(rl, skipflags, state, node):
    """Verify the integrity of the given revlog ``node`` while providing a hook
    point for extensions to influence the operation."""
    if skipflags:
        state[b'skipread'].add(node)
    else:
        # Side-effect: read content and verify hash.
        rl.revision(node)


# True if a fast implementation for persistent-nodemap is available
#
# We also consider we have a "fast" implementation in "pure" python because
# people using pure don't really have performance considerations (and a
# wheelbarrow of other slowness sources)
HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or util.safehasattr(
    parsers, 'BaseIndexObject'
)


@attr.s(slots=True, frozen=True)
class _revisioninfo(object):
    """Information about a revision that allows building its fulltext
    node:       expected hash of the revision
    p1, p2:     parent revs of the revision
    btext:      built text cache consisting of a one-element list
    cachedelta: (baserev, uncompressed_delta) or None
    flags:      flags associated to the revision storage

    One of btext[0] or cachedelta must be set.
    """

    node = attr.ib()
    p1 = attr.ib()
    p2 = attr.ib()
    btext = attr.ib()
    textlen = attr.ib()
    cachedelta = attr.ib()
    flags = attr.ib()


@interfaceutil.implementer(repository.irevisiondelta)
@attr.s(slots=True)
class revlogrevisiondelta(object):
    node = attr.ib()
    p1node = attr.ib()
    p2node = attr.ib()
    basenode = attr.ib()
    flags = attr.ib()
    baserevisionsize = attr.ib()
    revision = attr.ib()
    delta = attr.ib()
    sidedata = attr.ib()
    linknode = attr.ib(default=None)


@interfaceutil.implementer(repository.iverifyproblem)
@attr.s(frozen=True)
class revlogproblem(object):
    warning = attr.ib(default=None)
    error = attr.ib(default=None)
    node = attr.ib(default=None)


class revlogoldindex(list):
    entry_size = INDEX_ENTRY_V0.size

    @property
    def nodemap(self):
        msg = b"index.nodemap is deprecated, use index.[has_node|rev|get_rev]"
        util.nouideprecwarn(msg, b'5.3', stacklevel=2)
        return self._nodemap

    @util.propertycache
    def _nodemap(self):
        nodemap = nodemaputil.NodeMap({nullid: nullrev})
        for r in range(0, len(self)):
            n = self[r][7]
            nodemap[n] = r
        return nodemap

    def has_node(self, node):
        """return True if the node exists in the index"""
        return node in self._nodemap

    def rev(self, node):
        """return a revision for a node

        If the node is unknown, raise a RevlogError"""
        return self._nodemap[node]

    def get_rev(self, node):
        """return a revision for a node

        If the node is unknown, return None"""
        return self._nodemap.get(node)

    def append(self, tup):
        self._nodemap[tup[7]] = len(self)
        super(revlogoldindex, self).append(tup)

    def __delitem__(self, i):
        if not isinstance(i, slice) or not i.stop == -1 or i.step is not None:
            raise ValueError(b"deleting slices only supports a:-1 with step 1")
        for r in pycompat.xrange(i.start, len(self)):
            del self._nodemap[self[r][7]]
        super(revlogoldindex, self).__delitem__(i)

    def clearcaches(self):
        self.__dict__.pop('_nodemap', None)

    def __getitem__(self, i):
        if i == -1:
            return (0, 0, 0, -1, -1, -1, -1, nullid)
        return list.__getitem__(self, i)


class revlogoldio(object):
    def parseindex(self, data, inline):
        s = INDEX_ENTRY_V0.size
        index = []
        nodemap = nodemaputil.NodeMap({nullid: nullrev})
        n = off = 0
        l = len(data)
        while off + s <= l:
            cur = data[off : off + s]
            off += s
            e = INDEX_ENTRY_V0.unpack(cur)
            # transform to revlogv1 format
            e2 = (
                offset_type(e[0], 0),
                e[1],
                -1,
                e[2],
                e[3],
                nodemap.get(e[4], nullrev),
                nodemap.get(e[5], nullrev),
                e[6],
            )
            index.append(e2)
            nodemap[e[6]] = n
            n += 1

        index = revlogoldindex(index)
        return index, None

    def packentry(self, entry, node, version, rev):
        """return the binary representation of an entry

        entry:   a tuple containing all the values (see index.__getitem__)
        node:    a callback to convert a revision to nodeid
        version: the changelog version
        rev:     the revision number
        """
        if gettype(entry[0]):
            raise error.RevlogError(
                _(b'index entry flags need revlog version 1')
            )
        e2 = (
            getoffset(entry[0]),
            entry[1],
            entry[3],
            entry[4],
            node(entry[5]),
            node(entry[6]),
            entry[7],
        )
        return INDEX_ENTRY_V0.pack(*e2)


# corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
# signed integer)
_maxentrysize = 0x7FFFFFFF


class revlogio(object):
    def parseindex(self, data, inline):
        # call the C implementation to parse the index data
        index, cache = parsers.parse_index2(data, inline)
        return index, cache

    def packentry(self, entry, node, version, rev):
        p = INDEX_ENTRY_V1.pack(*entry)
        if rev == 0:
            p = INDEX_HEADER.pack(version) + p[4:]
        return p


class revlogv2io(object):
    def parseindex(self, data, inline):
        index, cache = parsers.parse_index2(data, inline, revlogv2=True)
        return index, cache

    def packentry(self, entry, node, version, rev):
        p = INDEX_ENTRY_V2.pack(*entry)
        if rev == 0:
            p = INDEX_HEADER.pack(version) + p[4:]
        return p


NodemapRevlogIO = None

if util.safehasattr(parsers, 'parse_index_devel_nodemap'):

    class NodemapRevlogIO(revlogio):
        """A debug oriented IO class that returns a PersistentNodeMapIndexObject

        The PersistentNodeMapIndexObject object is meant to test the persistent nodemap feature.
        """

        def parseindex(self, data, inline):
            index, cache = parsers.parse_index_devel_nodemap(data, inline)
            return index, cache


class rustrevlogio(revlogio):
    def parseindex(self, data, inline):
        index, cache = super(rustrevlogio, self).parseindex(data, inline)
        return rustrevlog.MixedIndex(index), cache


class revlog(object):
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.

    If checkambig, indexfile is opened with checkambig=True at
    writing, to avoid file stat ambiguity.

    If mmaplargeindex is True, and an mmapindexthreshold is set, the
    index will be mmapped rather than read if it is larger than the
    configured threshold.

    If censorable is True, the revlog can have censored revisions.

    If `upperboundcomp` is not None, this is the expected maximal gain from
    compression for the data content.

    `concurrencychecker` is an optional function that receives 3 arguments: a
    file handle, a filename, and an expected position. It should check whether
    the current position in the file handle is valid, and log/warn/fail (by
    raising).
    """

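    # Reading aid (sketch, derived from the accessors below): an index
    # entry is a tuple where entry[0] packs offset and flags, entry[1] is
    # the compressed length, entry[2] the uncompressed length, entry[3]
    # the delta base, entry[4] the linkrev, entry[5] and entry[6] the
    # parent revisions, and entry[7] the node.
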
    _flagserrorclass = error.RevlogError

    def __init__(
        self,
        opener,
        indexfile,
        datafile=None,
        checkambig=False,
        mmaplargeindex=False,
        censorable=False,
        upperboundcomp=None,
        persistentnodemap=False,
        concurrencychecker=None,
    ):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.

        """
        self.upperboundcomp = upperboundcomp
        self.indexfile = indexfile
        self.datafile = datafile or (indexfile[:-2] + b".d")
        self.nodemap_file = None
        if persistentnodemap:
            self.nodemap_file = nodemaputil.get_nodemap_file(
                opener, self.indexfile
            )

        self.opener = opener
        # When True, indexfile is opened with checkambig=True at writing, to
        # avoid file stat ambiguity.
        self._checkambig = checkambig
        self._mmaplargeindex = mmaplargeindex
        self._censorable = censorable
        # 3-tuple of (node, rev, text) for a raw revision.
        self._revisioncache = None
        # Maps rev to chain base rev.
        self._chainbasecache = util.lrucachedict(100)
        # 2-tuple of (offset, data) of raw data from the revlog at an offset.
        self._chunkcache = (0, b'')
        # How much data to read and cache into the raw revlog data cache.
        self._chunkcachesize = 65536
        self._maxchainlen = None
        self._deltabothparents = True
        self.index = None
        self._nodemap_docket = None
        # Mapping of partial identifiers to full nodes.
        self._pcache = {}
        # Mapping of revision integer to full node.
        self._compengine = b'zlib'
        self._compengineopts = {}
        self._maxdeltachainspan = -1
        self._withsparseread = False
        self._sparserevlog = False
        self._srdensitythreshold = 0.50
        self._srmingapsize = 262144

        # Make copy of flag processors so each revlog instance can support
        # custom flags.
        self._flagprocessors = dict(flagutil.flagprocessors)

        # 2-tuple of file handles being used for active writing.
        self._writinghandles = None

        self._loadindex()

        self._concurrencychecker = concurrencychecker

    def _loadindex(self):
        mmapindexthreshold = None
        opts = self.opener.options

        if b'revlogv2' in opts:
            newversionflags = REVLOGV2 | FLAG_INLINE_DATA
        elif b'revlogv1' in opts:
            newversionflags = REVLOGV1 | FLAG_INLINE_DATA
            if b'generaldelta' in opts:
                newversionflags |= FLAG_GENERALDELTA
        elif b'revlogv0' in self.opener.options:
            newversionflags = REVLOGV0
        else:
            newversionflags = REVLOG_DEFAULT_VERSION

        if b'chunkcachesize' in opts:
            self._chunkcachesize = opts[b'chunkcachesize']
        if b'maxchainlen' in opts:
            self._maxchainlen = opts[b'maxchainlen']
        if b'deltabothparents' in opts:
            self._deltabothparents = opts[b'deltabothparents']
        self._lazydelta = bool(opts.get(b'lazydelta', True))
        self._lazydeltabase = False
        if self._lazydelta:
            self._lazydeltabase = bool(opts.get(b'lazydeltabase', False))
        if b'compengine' in opts:
            self._compengine = opts[b'compengine']
        if b'zlib.level' in opts:
            self._compengineopts[b'zlib.level'] = opts[b'zlib.level']
        if b'zstd.level' in opts:
            self._compengineopts[b'zstd.level'] = opts[b'zstd.level']
        if b'maxdeltachainspan' in opts:
            self._maxdeltachainspan = opts[b'maxdeltachainspan']
        if self._mmaplargeindex and b'mmapindexthreshold' in opts:
            mmapindexthreshold = opts[b'mmapindexthreshold']
        self.hassidedata = bool(opts.get(b'side-data', False))
        self._sparserevlog = bool(opts.get(b'sparse-revlog', False))
        withsparseread = bool(opts.get(b'with-sparse-read', False))
        # sparse-revlog forces sparse-read
        self._withsparseread = self._sparserevlog or withsparseread
        if b'sparse-read-density-threshold' in opts:
            self._srdensitythreshold = opts[b'sparse-read-density-threshold']
        if b'sparse-read-min-gap-size' in opts:
            self._srmingapsize = opts[b'sparse-read-min-gap-size']
        if opts.get(b'enableellipsis'):
            self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

        # revlog v0 doesn't have flag processors
        for flag, processor in pycompat.iteritems(
            opts.get(b'flagprocessors', {})
        ):
            flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

        if self._chunkcachesize <= 0:
            raise error.RevlogError(
                _(b'revlog chunk cache size %r is not greater than 0')
                % self._chunkcachesize
            )
        elif self._chunkcachesize & (self._chunkcachesize - 1):
            raise error.RevlogError(
                _(b'revlog chunk cache size %r is not a power of 2')
                % self._chunkcachesize
            )

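        # Illustration: n & (n - 1) clears the lowest set bit, so the check
        # above is zero exactly for powers of two (65536 & 65535 == 0,
        # while 65537 & 65536 != 0).
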
        indexdata = b''
        self._initempty = True
        try:
            with self._indexfp() as f:
                if (
                    mmapindexthreshold is not None
                    and self.opener.fstat(f).st_size >= mmapindexthreshold
                ):
                    # TODO: should .close() to release resources without
                    # relying on Python GC
                    indexdata = util.buffer(util.mmapread(f))
                else:
                    indexdata = f.read()
            if len(indexdata) > 0:
                versionflags = INDEX_HEADER.unpack(indexdata[:4])[0]
                self._initempty = False
            else:
                versionflags = newversionflags
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise

            versionflags = newversionflags

        self.version = versionflags

        flags = versionflags & ~0xFFFF
        fmt = versionflags & 0xFFFF

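        # Illustration: the header word packs format and flags; e.g. a v1
        # inline general-delta revlog stores REVLOGV1 | FLAG_INLINE_DATA |
        # FLAG_GENERALDELTA == 0x00030001, so fmt is 0x0001 and flags is
        # 0x00030000.
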
        if fmt == REVLOGV0:
            if flags:
                raise error.RevlogError(
                    _(b'unknown flags (%#04x) in version %d revlog %s')
                    % (flags >> 16, fmt, self.indexfile)
                )

            self._inline = False
            self._generaldelta = False

        elif fmt == REVLOGV1:
            if flags & ~REVLOGV1_FLAGS:
                raise error.RevlogError(
                    _(b'unknown flags (%#04x) in version %d revlog %s')
                    % (flags >> 16, fmt, self.indexfile)
                )

            self._inline = versionflags & FLAG_INLINE_DATA
            self._generaldelta = versionflags & FLAG_GENERALDELTA

        elif fmt == REVLOGV2:
            if flags & ~REVLOGV2_FLAGS:
                raise error.RevlogError(
                    _(b'unknown flags (%#04x) in version %d revlog %s')
                    % (flags >> 16, fmt, self.indexfile)
                )

            # There is a bug in the transaction handling when going from an
            # inline revlog to a separate index and data file. Turn it off until
            # it's fixed, since v2 revlogs sometimes get rewritten on exchange.
            # See issue6485
            self._inline = False
            # generaldelta implied by version 2 revlogs.
            self._generaldelta = True

        else:
            raise error.RevlogError(
                _(b'unknown version (%d) in revlog %s') % (fmt, self.indexfile)
            )

        self.nodeconstants = sha1nodeconstants
        self.nullid = self.nodeconstants.nullid

        # sparse-revlog can't be on without general-delta (issue6056)
        if not self._generaldelta:
            self._sparserevlog = False

        self._storedeltachains = True

        devel_nodemap = (
            self.nodemap_file
            and opts.get(b'devel-force-nodemap', False)
            and NodemapRevlogIO is not None
        )

        use_rust_index = False
        if rustrevlog is not None:
            if self.nodemap_file is not None:
                use_rust_index = True
            else:
                use_rust_index = self.opener.options.get(b'rust.index')

        self._io = revlogio()
        if self.version == REVLOGV0:
            self._io = revlogoldio()
        elif fmt == REVLOGV2:
            self._io = revlogv2io()
        elif devel_nodemap:
            self._io = NodemapRevlogIO()
        elif use_rust_index:
            self._io = rustrevlogio()
        try:
            d = self._io.parseindex(indexdata, self._inline)
            index, _chunkcache = d
            use_nodemap = (
                not self._inline
                and self.nodemap_file is not None
                and util.safehasattr(index, 'update_nodemap_data')
            )
            if use_nodemap:
                nodemap_data = nodemaputil.persisted_data(self)
                if nodemap_data is not None:
                    docket = nodemap_data[0]
                    if (
                        len(d[0]) > docket.tip_rev
                        and d[0][docket.tip_rev][7] == docket.tip_node
                    ):
                        # no changelog tampering
                        self._nodemap_docket = docket
                        index.update_nodemap_data(*nodemap_data)
        except (ValueError, IndexError):
            raise error.RevlogError(
                _(b"index %s is corrupted") % self.indexfile
            )
        self.index, self._chunkcache = d
        if not self._chunkcache:
            self._chunkclear()
        # revnum -> (chain-length, sum-delta-length)
        self._chaininfocache = util.lrucachedict(500)
        # revlog header -> revlog compressor
        self._decompressors = {}

    @util.propertycache
    def _compressor(self):
        engine = util.compengines[self._compengine]
        return engine.revlogcompressor(self._compengineopts)

    def _indexfp(self, mode=b'r'):
        """file object for the revlog's index file"""
        args = {'mode': mode}
        if mode != b'r':
            args['checkambig'] = self._checkambig
        if mode == b'w':
            args['atomictemp'] = True
        return self.opener(self.indexfile, **args)

    def _datafp(self, mode=b'r'):
        """file object for the revlog's data file"""
        return self.opener(self.datafile, mode=mode)

    @contextlib.contextmanager
    def _datareadfp(self, existingfp=None):
        """file object suitable to read data"""
        # Use explicit file handle, if given.
        if existingfp is not None:
            yield existingfp

        # Use a file handle being actively used for writes, if available.
        # There is some danger to doing this because reads will seek the
        # file. However, _writeentry() performs a SEEK_END before all writes,
        # so we should be safe.
        elif self._writinghandles:
            if self._inline:
                yield self._writinghandles[0]
            else:
                yield self._writinghandles[1]

        # Otherwise open a new file handle.
        else:
            if self._inline:
                func = self._indexfp
            else:
                func = self._datafp
            with func() as fp:
                yield fp

    def tiprev(self):
        return len(self.index) - 1

    def tip(self):
        return self.node(self.tiprev())

    def __contains__(self, rev):
        return 0 <= rev < len(self)

    def __len__(self):
        return len(self.index)

    def __iter__(self):
        return iter(pycompat.xrange(len(self)))

    def revs(self, start=0, stop=None):
        """iterate over all revs in this revlog (from start to stop)"""
        return storageutil.iterrevs(len(self), start=start, stop=stop)

    @property
    def nodemap(self):
        msg = (
            b"revlog.nodemap is deprecated, "
            b"use revlog.index.[has_node|rev|get_rev]"
        )
        util.nouideprecwarn(msg, b'5.3', stacklevel=2)
        return self.index.nodemap

    @property
    def _nodecache(self):
        msg = b"revlog._nodecache is deprecated, use revlog.index.nodemap"
        util.nouideprecwarn(msg, b'5.3', stacklevel=2)
        return self.index.nodemap

    def hasnode(self, node):
        try:
            self.rev(node)
            return True
        except KeyError:
            return False

    def candelta(self, baserev, rev):
        """whether two revisions (baserev, rev) can be delta-ed or not"""
        # Disable delta if either rev requires a content-changing flag
        # processor (ex. LFS). This is because such flag processor can alter
        # the rawtext content that the delta will be based on, and two clients
        # could have a same revlog node with different flags (i.e. different
        # rawtext contents) and the delta could be incompatible.
        if (self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS) or (
            self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS
        ):
            return False
        return True

    def update_caches(self, transaction):
        if self.nodemap_file is not None:
            if transaction is None:
                nodemaputil.update_persistent_nodemap(self)
            else:
                nodemaputil.setup_persistent_nodemap(transaction, self)

    def clearcaches(self):
        self._revisioncache = None
        self._chainbasecache.clear()
        self._chunkcache = (0, b'')
        self._pcache = {}
        self._nodemap_docket = None
        self.index.clearcaches()
        # The python code is the one responsible for validating the docket, we
        # end up having to refresh it here.
        use_nodemap = (
            not self._inline
            and self.nodemap_file is not None
            and util.safehasattr(self.index, 'update_nodemap_data')
        )
        if use_nodemap:
            nodemap_data = nodemaputil.persisted_data(self)
            if nodemap_data is not None:
                self._nodemap_docket = nodemap_data[0]
                self.index.update_nodemap_data(*nodemap_data)

    def rev(self, node):
        try:
            return self.index.rev(node)
        except TypeError:
            raise
        except error.RevlogError:
            # parsers.c radix tree lookup failed
            if node == wdirid or node in wdirfilenodeids:
                raise error.WdirUnsupported
            raise error.LookupError(node, self.indexfile, _(b'no node'))

    # Accessors for index entries.

    # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
    # are flags.
    def start(self, rev):
        return int(self.index[rev][0] >> 16)

    def flags(self, rev):
        return self.index[rev][0] & 0xFFFF

    def length(self, rev):
        return self.index[rev][1]

    def sidedata_length(self, rev):
        if self.version & 0xFFFF != REVLOGV2:
            return 0
        return self.index[rev][9]

    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.rawdata(rev)
        return len(t)

    def size(self, rev):
        """length of non-raw text (processed by a "read" flag processor)"""
        # fast path: if no "read" flag processor could change the content,
        # size is rawsize. note: ELLIPSIS is known to not change the content.
        flags = self.flags(rev)
        if flags & (flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
            return self.rawsize(rev)

        return len(self.revision(rev, raw=False))

    def chainbase(self, rev):
        base = self._chainbasecache.get(rev)
        if base is not None:
            return base

        index = self.index
        iterrev = rev
        base = index[iterrev][3]
        while base != iterrev:
            iterrev = base
            base = index[iterrev][3]

        self._chainbasecache[rev] = base
        return base

    def linkrev(self, rev):
        return self.index[rev][4]

    def parentrevs(self, rev):
        try:
            entry = self.index[rev]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise
-        if entry[5] == nullrev:
-            return entry[6], entry[5]
-        else:
-            return entry[5], entry[6]
+
+        return entry[5], entry[6]
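    # Effect of the backout (sketch): a revision stored with p1 == nullrev
    # and a real p2 is reported as (nullrev, p2) again, instead of being
    # reordered to (p2, nullrev) at read time as 49fd21f32695 did.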

    # fast parentrevs(rev) where rev isn't filtered
    _uncheckedparentrevs = parentrevs

    def node(self, rev):
        try:
            return self.index[rev][7]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise

    # Derived from index values.

    def end(self, rev):
        return self.start(rev) + self.length(rev)

    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
-        # inline node() to avoid function call overhead
-        if d[5] == nullid:
-            return i[d[6]][7], i[d[5]][7]
-        else:
-            return i[d[5]][7], i[d[6]][7]
+        return i[d[5]][7], i[d[6]][7]  # map revisions to nodes inline

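    # The same read-time reordering is dropped here at the node level, so
    # parents() mirrors parentrevs() and maps the stored parent revisions
    # straight to their nodes.
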
917 def chainlen(self, rev):
911 def chainlen(self, rev):
918 return self._chaininfo(rev)[0]
912 return self._chaininfo(rev)[0]
919
913
920 def _chaininfo(self, rev):
914 def _chaininfo(self, rev):
921 chaininfocache = self._chaininfocache
915 chaininfocache = self._chaininfocache
922 if rev in chaininfocache:
916 if rev in chaininfocache:
923 return chaininfocache[rev]
917 return chaininfocache[rev]
924 index = self.index
918 index = self.index
925 generaldelta = self._generaldelta
919 generaldelta = self._generaldelta
926 iterrev = rev
920 iterrev = rev
927 e = index[iterrev]
921 e = index[iterrev]
928 clen = 0
922 clen = 0
929 compresseddeltalen = 0
923 compresseddeltalen = 0
930 while iterrev != e[3]:
924 while iterrev != e[3]:
931 clen += 1
925 clen += 1
932 compresseddeltalen += e[1]
926 compresseddeltalen += e[1]
933 if generaldelta:
927 if generaldelta:
934 iterrev = e[3]
928 iterrev = e[3]
935 else:
929 else:
936 iterrev -= 1
930 iterrev -= 1
937 if iterrev in chaininfocache:
931 if iterrev in chaininfocache:
938 t = chaininfocache[iterrev]
932 t = chaininfocache[iterrev]
939 clen += t[0]
933 clen += t[0]
940 compresseddeltalen += t[1]
934 compresseddeltalen += t[1]
941 break
935 break
942 e = index[iterrev]
936 e = index[iterrev]
943 else:
937 else:
944 # Add text length of base since decompressing that also takes
938 # Add text length of base since decompressing that also takes
945 # work. For cache hits the length is already included.
939 # work. For cache hits the length is already included.
946 compresseddeltalen += e[1]
940 compresseddeltalen += e[1]
947 r = (clen, compresseddeltalen)
941 r = (clen, compresseddeltalen)
948 chaininfocache[rev] = r
942 chaininfocache[rev] = r
949 return r
943 return r
950
944
951 def _deltachain(self, rev, stoprev=None):
945 def _deltachain(self, rev, stoprev=None):
952 """Obtain the delta chain for a revision.
946 """Obtain the delta chain for a revision.
953
947
954 ``stoprev`` specifies a revision to stop at. If not specified, we
948 ``stoprev`` specifies a revision to stop at. If not specified, we
955 stop at the base of the chain.
949 stop at the base of the chain.
956
950
957 Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
951 Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
958 revs in ascending order and ``stopped`` is a bool indicating whether
952 revs in ascending order and ``stopped`` is a bool indicating whether
959 ``stoprev`` was hit.
953 ``stoprev`` was hit.
960 """
954 """
961 # Try C implementation.
955 # Try C implementation.
962 try:
956 try:
963 return self.index.deltachain(rev, stoprev, self._generaldelta)
957 return self.index.deltachain(rev, stoprev, self._generaldelta)
964 except AttributeError:
958 except AttributeError:
965 pass
959 pass
966
960
967 chain = []
961 chain = []
968
962
969 # Alias to prevent attribute lookup in tight loop.
963 # Alias to prevent attribute lookup in tight loop.
970 index = self.index
964 index = self.index
971 generaldelta = self._generaldelta
965 generaldelta = self._generaldelta
972
966
973 iterrev = rev
967 iterrev = rev
974 e = index[iterrev]
968 e = index[iterrev]
975 while iterrev != e[3] and iterrev != stoprev:
969 while iterrev != e[3] and iterrev != stoprev:
976 chain.append(iterrev)
970 chain.append(iterrev)
977 if generaldelta:
971 if generaldelta:
978 iterrev = e[3]
972 iterrev = e[3]
979 else:
973 else:
980 iterrev -= 1
974 iterrev -= 1
981 e = index[iterrev]
975 e = index[iterrev]
982
976
983 if iterrev == stoprev:
977 if iterrev == stoprev:
984 stopped = True
978 stopped = True
985 else:
979 else:
986 chain.append(iterrev)
980 chain.append(iterrev)
987 stopped = False
981 stopped = False
988
982
989 chain.reverse()
983 chain.reverse()
990 return chain, stopped
984 return chain, stopped
991
985
    def ancestors(self, revs, stoprev=0, inclusive=False):
        """Generate the ancestors of 'revs' in reverse revision order.
        Does not generate revs lower than stoprev.

        See the documentation for ancestor.lazyancestors for more details."""

        # first, make sure start revisions aren't filtered
        revs = list(revs)
        checkrev = self.node
        for r in revs:
            checkrev(r)
        # and we're sure ancestors aren't filtered as well

        if rustancestor is not None:
            lazyancestors = rustancestor.LazyAncestors
            arg = self.index
        else:
            lazyancestors = ancestor.lazyancestors
            arg = self._uncheckedparentrevs
        return lazyancestors(arg, revs, stoprev=stoprev, inclusive=inclusive)

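    # Usage sketch (hypothetical revlog ``rl``, an assumption): the returned
    # lazyancestors object is iterable and supports membership tests without
    # materializing the whole ancestor set up front:
    #
    #     ancs = rl.ancestors([10, 12], stoprev=3, inclusive=True)
    #     5 in ancs    # lazy membership test
    #     list(ancs)   # revs in reverse revision order, none lower than 3
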
    def descendants(self, revs):
        return dagop.descendantrevs(revs, self.revs, self.parentrevs)

    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common. In revset terminology, we return the
        tuple:

          ::common, (::heads) - (::common)

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        class lazyset(object):
            def __init__(self, lazyvalues):
                self.addedvalues = set()
                self.lazyvalues = lazyvalues

            def __contains__(self, value):
                return value in self.addedvalues or value in self.lazyvalues

            def __iter__(self):
                added = self.addedvalues
                for r in added:
                    yield r
                for r in self.lazyvalues:
                    if r not in added:
                        yield r

            def add(self, value):
                self.addedvalues.add(value)

            def update(self, values):
                self.addedvalues.update(values)

        has = lazyset(self.ancestors(common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = collections.deque(r for r in heads if r not in has)
        while visit:
            r = visit.popleft()
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(miss) for miss in missing]

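    # Semantics sketch (hedged, reusing the revset notation from the
    # docstring): for common=[c] and heads=[h], the return value corresponds
    # to
    #
    #     (::c, (::h) - (::c))
    #
    # i.e. a lazy set of everything reachable from ``c`` plus a sorted list
    # of nodes reachable from ``h`` but not from ``c``.
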
    def incrementalmissingrevs(self, common=None):
        """Return an object that can be used to incrementally compute the
        revision numbers of the ancestors of arbitrary sets that are not
        ancestors of common. This is an ancestor.incrementalmissingancestors
        object.

        'common' is a list of revision numbers. If common is not supplied, uses
        nullrev.
        """
        if common is None:
            common = [nullrev]

        if rustancestor is not None:
            return rustancestor.MissingAncestors(self.index, common)
        return ancestor.incrementalmissingancestors(self.parentrevs, common)

    def findmissingrevs(self, common=None, heads=None):
        """Return the revision numbers of the ancestors of heads that
        are not ancestors of common.

        More specifically, return a list of revision numbers corresponding to
        nodes N such that every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of revision numbers. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullrev."""
        if common is None:
            common = [nullrev]
        if heads is None:
            heads = self.headrevs()

        inc = self.incrementalmissingrevs(common=common)
        return inc.missingancestors(heads)

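    # Usage sketch (hypothetical revlog ``rl``, an assumption): the
    # incremental object lets callers grow the "common" set over time, which
    # ``findmissingrevs`` wraps for the one-shot case:
    #
    #     inc = rl.incrementalmissingrevs(common=[c])
    #     miss = inc.missingancestors([h])  # revset: (::h) - (::c)
    #     inc.addbases([h])                 # extend the common set later
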
    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        inc = self.incrementalmissingrevs(common=common)
        return [self.node(r) for r in inc.missingancestors(heads)]

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses the list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid]  # Everybody's a descendant of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in self], [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendant of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n)  # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update(
                            [p for p in self.parents(n) if p != nullid]
                        )
                    elif n in heads:  # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [root for root in roots if root in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(root) for root in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a set.
        descendants = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendants.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendants, empty parents will look like
        # they're descendants.
        for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
            n = self.node(r)
            isdescendant = False
            if lowestrev == nullrev:  # Everybody is a descendant of nullid
                isdescendant = True
            elif n in descendants:
                # n is already a descendant
                isdescendant = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendants before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendants, it's not a root.
                    if (p[0] in descendants) or (p[1] in descendants):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendant if either of its parents are
                # descendants. (We seeded the dependents list with the roots
                # up there, remember?)
                if (p[0] in descendants) or (p[1] in descendants):
                    descendants.add(n)
                    isdescendant = True
            if isdescendant and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendants and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [head for head, flag in pycompat.iteritems(heads) if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

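    # Illustrative sketch (assumption): for a linear history n0 -> n1 -> n2,
    #
    #     rl.nodesbetween([n0], [n2])
    #     # -> ([n0, n1, n2], [n0], [n2])
    #
    # where the first element is topologically sorted, as documented above.
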
    def headrevs(self, revs=None):
        if revs is None:
            try:
                return self.index.headrevs()
            except AttributeError:
                return self._headrevs()
        if rustdagop is not None:
            return rustdagop.headrevs(self.index, revs)
        return dagop.headrevs(revs, self._uncheckedparentrevs)

    def computephases(self, roots):
        return self.index.computephasesmapsets(roots)

    def _headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        # we won't iterate over filtered revs, so nobody is a head at start
        ishead = [0] * (count + 1)
        index = self.index
        for r in self:
            ishead[r] = 1  # I may be a head
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0  # my parents are not
        return [r for r, val in enumerate(ishead) if val]

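    # Worked example (hedged): in a 4-revision log where revision 1 has
    # parent 0 and revisions 2 and 3 both have parent 1, every rev first
    # marks itself as a candidate head and then clears its parents, so only
    # the childless revs survive:
    #
    #     rl._headrevs()  # -> [2, 3]
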
    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullrev
        else:
            start = self.rev(start)

        stoprevs = {self.rev(n) for n in stop or []}

        revs = dagop.headrevssubset(
            self.revs, self.parentrevs, startrev=start, stoprevs=stoprevs
        )

        return [self.node(rev) for rev in revs]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in self.revs(start=p + 1):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def commonancestorsheads(self, a, b):
        """calculate all the heads of the common ancestors of nodes a and b"""
        a, b = self.rev(a), self.rev(b)
        ancs = self._commonancestorsheads(a, b)
        return pycompat.maplist(self.node, ancs)

    def _commonancestorsheads(self, *revs):
        """calculate all the heads of the common ancestors of revs"""
        try:
            ancs = self.index.commonancestorsheads(*revs)
        except (AttributeError, OverflowError):  # C implementation failed
            ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
        return ancs

    def isancestor(self, a, b):
        """return True if node a is an ancestor of node b

        A revision is considered an ancestor of itself."""
        a, b = self.rev(a), self.rev(b)
        return self.isancestorrev(a, b)

    def isancestorrev(self, a, b):
        """return True if revision a is an ancestor of revision b

        A revision is considered an ancestor of itself.

        The implementation of this is trivial but the use of
        reachableroots is not."""
        if a == nullrev:
            return True
        elif a == b:
            return True
        elif a > b:
            return False
        return bool(self.reachableroots(a, [b], [a], includepath=False))

    def reachableroots(self, minroot, heads, roots, includepath=False):
        """return (heads(::(<roots> and <roots>::<heads>)))

        If includepath is True, return (<roots>::<heads>)."""
        try:
            return self.index.reachableroots2(
                minroot, heads, roots, includepath
            )
        except AttributeError:
            return dagop._reachablerootspure(
                self.parentrevs, minroot, roots, heads, includepath
            )

    def ancestor(self, a, b):
        """calculate the "best" common ancestor of nodes a and b"""

        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.ancestors(a, b)
        except (AttributeError, OverflowError):
            ancs = ancestor.ancestors(self.parentrevs, a, b)
        if ancs:
            # choose a consistent winner when there's a tie
            return min(map(self.node, ancs))
        return nullid

    def _match(self, id):
        if isinstance(id, int):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node)  # quick search the index
                return node
            except error.LookupError:
                pass  # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if b"%d" % rev != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (TypeError, error.LookupError):
                pass

    def _partialmatch(self, id):
        # we don't care about wdirfilenodeids as they should always be full
        # hashes
        maybewdir = wdirhex.startswith(id)
        try:
            partial = self.index.partialmatch(id)
            if partial and self.hasnode(partial):
                if maybewdir:
                    # single 'ff...' match in radix tree, ambiguous with wdir
                    raise error.RevlogError
                return partial
            if maybewdir:
                # no 'ff...' match in radix tree, wdir identified
                raise error.WdirUnsupported
            return None
        except error.RevlogError:
            # parsers.c radix tree lookup gave multiple matches
            # fast path: for unfiltered changelog, radix tree is accurate
            if not getattr(self, 'filteredrevs', None):
                raise error.AmbiguousPrefixLookupError(
                    id, self.indexfile, _(b'ambiguous identifier')
                )
            # fall through to slow path that filters hidden revisions
        except (AttributeError, ValueError):
            # we are pure python, or key was too short to search radix tree
            pass

        if id in self._pcache:
            return self._pcache[id]

        if len(id) <= 40:
            try:
                # hex(node)[:...]
                l = len(id) // 2  # grab an even number of digits
                prefix = bin(id[: l * 2])
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [
                    n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                ]
                if nullhex.startswith(id):
                    nl.append(nullid)
                if len(nl) > 0:
                    if len(nl) == 1 and not maybewdir:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise error.AmbiguousPrefixLookupError(
                        id, self.indexfile, _(b'ambiguous identifier')
                    )
                if maybewdir:
                    raise error.WdirUnsupported
                return None
            except TypeError:
                pass

    def lookup(self, id):
        """locate a node based on:
        - revision number or str(revision number)
        - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise error.LookupError(id, self.indexfile, _(b'no match found'))

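    # Usage sketch (hypothetical identifiers, an assumption): ``lookup``
    # accepts any of the forms listed in the docstring, e.g.
    #
    #     rl.lookup(0)        # revision number
    #     rl.lookup(b'0')     # str(revision number)
    #     rl.lookup(node)     # full binary nodeid
    #     rl.lookup(b'1f0e')  # unambiguous hex prefix
    #
    # and raises error.LookupError when nothing matches.
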
    def shortest(self, node, minlength=1):
        """Find the shortest unambiguous prefix that matches node."""

        def isvalid(prefix):
            try:
                matchednode = self._partialmatch(prefix)
            except error.AmbiguousPrefixLookupError:
                return False
            except error.WdirUnsupported:
                # single 'ff...' match
                return True
            if matchednode is None:
                raise error.LookupError(node, self.indexfile, _(b'no node'))
            return True

        def maybewdir(prefix):
            return all(c == b'f' for c in pycompat.iterbytestr(prefix))

        hexnode = hex(node)

        def disambiguate(hexnode, minlength):
            """Disambiguate against wdirid."""
            for length in range(minlength, len(hexnode) + 1):
                prefix = hexnode[:length]
                if not maybewdir(prefix):
                    return prefix

        if not getattr(self, 'filteredrevs', None):
            try:
                length = max(self.index.shortest(node), minlength)
                return disambiguate(hexnode, length)
            except error.RevlogError:
                if node != wdirid:
                    raise error.LookupError(node, self.indexfile, _(b'no node'))
            except AttributeError:
                # Fall through to pure code
                pass

        if node == wdirid:
            for length in range(minlength, len(hexnode) + 1):
                prefix = hexnode[:length]
                if isvalid(prefix):
                    return prefix

        for length in range(minlength, len(hexnode) + 1):
            prefix = hexnode[:length]
            if isvalid(prefix):
                return disambiguate(hexnode, length)

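    # Illustrative sketch (assumption): ``shortest`` grows the prefix until
    # it is unambiguous against both other nodes and the virtual wdir id:
    #
    #     rl.shortest(node)               # e.g. b'1f0e'
    #     rl.shortest(node, minlength=6)  # at least 6 hex digits
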
    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different from what is stored.
        """
        p1, p2 = self.parents(node)
        return storageutil.hashrevisionsha1(text, p1, p2) != node

    def _cachesegment(self, offset, data):
        """Add a segment to the revlog cache.

        Accepts an absolute offset and the data that is at that location.
        """
        o, d = self._chunkcache
        # try to add to existing cache
        if o + len(d) == offset and len(d) + len(data) < _chunksize:
            self._chunkcache = o, d + data
        else:
            self._chunkcache = offset, data

    def _readsegment(self, offset, length, df=None):
        """Load a segment of raw data from the revlog.

        Accepts an absolute offset, length to read, and an optional existing
        file handle to read from.

        If an existing file handle is passed, it will be seeked and the
        original seek position will NOT be restored.

        Returns a str or buffer of raw byte data.

        Raises if the requested number of bytes could not be read.
        """
        # Cache data both forward and backward around the requested
        # data, in a fixed size window. This helps speed up operations
        # involving reading the revlog backwards.
        cachesize = self._chunkcachesize
        realoffset = offset & ~(cachesize - 1)
        reallength = (
            (offset + length + cachesize) & ~(cachesize - 1)
        ) - realoffset
        with self._datareadfp(df) as df:
            df.seek(realoffset)
            d = df.read(reallength)

        self._cachesegment(realoffset, d)
        if offset != realoffset or reallength != length:
            startoffset = offset - realoffset
            if len(d) - startoffset < length:
                raise error.RevlogError(
                    _(
                        b'partial read of revlog %s; expected %d bytes from '
                        b'offset %d, got %d'
                    )
                    % (
                        self.indexfile if self._inline else self.datafile,
                        length,
                        realoffset,
                        len(d) - startoffset,
                    )
                )

            return util.buffer(d, startoffset, length)

        if len(d) < length:
            raise error.RevlogError(
                _(
                    b'partial read of revlog %s; expected %d bytes from offset '
                    b'%d, got %d'
                )
                % (
                    self.indexfile if self._inline else self.datafile,
                    length,
                    offset,
                    len(d),
                )
            )

        return d

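    # Worked example of the alignment arithmetic above (hedged): with a
    # chunk cache size of 65536, a request for offset=70000, length=1000
    # reads one cache-aligned window around the requested bytes:
    #
    #     realoffset = 70000 & ~65535                         # -> 65536
    #     reallength = ((70000 + 1000 + 65536) & ~65535) - 65536
    #                                                         # -> 65536
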
    def _getsegment(self, offset, length, df=None):
        """Obtain a segment of raw data from the revlog.

        Accepts an absolute offset, length of bytes to obtain, and an
        optional file handle to the already-opened revlog. If the file
        handle is used, its original seek position will not be preserved.

        Requests for data may be returned from a cache.

        Returns a str or a buffer instance of raw byte data.
        """
        o, d = self._chunkcache
        l = len(d)

        # is it in the cache?
        cachestart = offset - o
        cacheend = cachestart + length
        if cachestart >= 0 and cacheend <= l:
            if cachestart == 0 and cacheend == l:
                return d  # avoid a copy
            return util.buffer(d, cachestart, cacheend - cachestart)

        return self._readsegment(offset, length, df=df)

    def _getsegmentforrevs(self, startrev, endrev, df=None):
        """Obtain a segment of raw data corresponding to a range of revisions.

        Accepts the start and end revisions and an optional already-open
        file handle to be used for reading. If the file handle is read, its
        seek position will not be preserved.

        Requests for data may be satisfied by a cache.

        Returns a 2-tuple of (offset, data) for the requested range of
        revisions. Offset is the integer offset from the beginning of the
        revlog and data is a str or buffer of the raw byte data.

        Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
        to determine where each revision's data begins and ends.
        """
        # Inlined self.start(startrev) & self.end(endrev) for perf reasons
        # (functions are expensive).
        index = self.index
        istart = index[startrev]
        start = int(istart[0] >> 16)
        if startrev == endrev:
            end = start + istart[1]
        else:
            iend = index[endrev]
            end = int(iend[0] >> 16) + iend[1]

        if self._inline:
            start += (startrev + 1) * self.index.entry_size
            end += (endrev + 1) * self.index.entry_size
        length = end - start

        return start, self._getsegment(start, length, df=df)

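    # Note on the inline adjustment above (hedged): in an inline revlog the
    # index entries and revision data are interleaved in a single file, so
    # the physical position of revision ``r``'s data is shifted by
    # ``(r + 1) * entry_size`` bytes of index entries (64 bytes per entry in
    # revlog v1, an assumption here).
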
    def _chunk(self, rev, df=None):
        """Obtain a single decompressed chunk for a revision.

        Accepts an integer revision and an optional already-open file handle
        to be used for reading. If used, the seek position of the file will not
        be preserved.

        Returns a str holding uncompressed data for the requested revision.
        """
        return self.decompress(self._getsegmentforrevs(rev, rev, df=df)[1])

    def _chunks(self, revs, df=None, targetsize=None):
        """Obtain decompressed chunks for the specified revisions.

        Accepts an iterable of numeric revisions that are assumed to be in
        ascending order. Also accepts an optional already-open file handle
        to be used for reading. If used, the seek position of the file will
        not be preserved.

        This function is similar to calling ``self._chunk()`` multiple times,
        but is faster.

        Returns a list with decompressed data for each requested revision.
        """
        if not revs:
            return []
        start = self.start
        length = self.length
        inline = self._inline
        iosize = self.index.entry_size
        buffer = util.buffer

        l = []
        ladd = l.append

        if not self._withsparseread:
            slicedchunks = (revs,)
        else:
            slicedchunks = deltautil.slicechunk(
                self, revs, targetsize=targetsize
            )

        for revschunk in slicedchunks:
            firstrev = revschunk[0]
            # Skip trailing revisions with empty diff
            for lastrev in revschunk[::-1]:
                if length(lastrev) != 0:
                    break

            try:
                offset, data = self._getsegmentforrevs(firstrev, lastrev, df=df)
            except OverflowError:
                # issue4215 - we can't cache a run of chunks greater than
                # 2G on Windows
                return [self._chunk(rev, df=df) for rev in revschunk]

            decomp = self.decompress
            for rev in revschunk:
                chunkstart = start(rev)
                if inline:
                    chunkstart += (rev + 1) * iosize
                chunklength = length(rev)
                ladd(decomp(buffer(data, chunkstart - offset, chunklength)))

        return l

    def _chunkclear(self):
        """Clear the raw chunk cache."""
        self._chunkcache = (0, b'')

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self._generaldelta:
            return base
        else:
            return rev - 1

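    # Semantics sketch (assumption): ``deltaparent`` normalizes the stored
    # base field of the index entry:
    #
    #     rl.deltaparent(r) == nullrev   # r stores a full snapshot
    #     rl.deltaparent(r) == base      # generaldelta: delta vs. any rev
    #     rl.deltaparent(r) == r - 1     # legacy: delta vs. the previous rev
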
    def issnapshot(self, rev):
        """tells whether rev is a snapshot"""
        if not self._sparserevlog:
            return self.deltaparent(rev) == nullrev
        elif util.safehasattr(self.index, b'issnapshot'):
            # directly assign the method to cache the testing and access
            self.issnapshot = self.index.issnapshot
            return self.issnapshot(rev)
        if rev == nullrev:
            return True
        entry = self.index[rev]
        base = entry[3]
        if base == rev:
            return True
        if base == nullrev:
            return True
        p1 = entry[5]
        p2 = entry[6]
        if base == p1 or base == p2:
            return False
        return self.issnapshot(base)

    def snapshotdepth(self, rev):
        """number of snapshots in the chain before this one"""
        if not self.issnapshot(rev):
            raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
        return len(self._deltachain(rev)[0]) - 1

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions

        The delta calculated is in binary form and is intended to be written to
        revlog data directly. So this function needs raw revision data.
        """
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return bytes(self._chunk(rev2))

        return mdiff.textdiff(self.rawdata(rev1), self.rawdata(rev2))

    def _processflags(self, text, flags, operation, raw=False):
        """deprecated entry point to access flag processors"""
        msg = b'_processflag(...) use the specialized variant'
        util.nouideprecwarn(msg, b'5.2', stacklevel=2)
        if raw:
            return text, flagutil.processflagsraw(self, text, flags)
        elif operation == b'read':
            return flagutil.processflagsread(self, text, flags)
        else:  # write operation
            return flagutil.processflagswrite(self, text, flags)

1848 def revision(self, nodeorrev, _df=None, raw=False):
1842 def revision(self, nodeorrev, _df=None, raw=False):
1849 """return an uncompressed revision of a given node or revision
1843 """return an uncompressed revision of a given node or revision
1850 number.
1844 number.
1851
1845
1852 _df - an existing file handle to read from. (internal-only)
1846 _df - an existing file handle to read from. (internal-only)
1853 raw - an optional argument specifying if the revision data is to be
1847 raw - an optional argument specifying if the revision data is to be
1854 treated as raw data when applying flag transforms. 'raw' should be set
1848 treated as raw data when applying flag transforms. 'raw' should be set
1855 to True when generating changegroups or in debug commands.
1849 to True when generating changegroups or in debug commands.
1856 """
1850 """
1857 if raw:
1851 if raw:
1858 msg = (
1852 msg = (
1859 b'revlog.revision(..., raw=True) is deprecated, '
1853 b'revlog.revision(..., raw=True) is deprecated, '
1860 b'use revlog.rawdata(...)'
1854 b'use revlog.rawdata(...)'
1861 )
1855 )
1862 util.nouideprecwarn(msg, b'5.2', stacklevel=2)
1856 util.nouideprecwarn(msg, b'5.2', stacklevel=2)
1863 return self._revisiondata(nodeorrev, _df, raw=raw)[0]
1857 return self._revisiondata(nodeorrev, _df, raw=raw)[0]
1864
1858
    def sidedata(self, nodeorrev, _df=None):
        """a map of extra data related to the changeset but not part of the hash

        This function currently returns a dictionary. However, a more advanced
        mapping object will likely be used in the future for more
        efficient/lazy code.
        """
        return self._revisiondata(nodeorrev, _df)[1]

    def _revisiondata(self, nodeorrev, _df=None, raw=False):
        # deal with <nodeorrev> argument type
        if isinstance(nodeorrev, int):
            rev = nodeorrev
            node = self.node(rev)
        else:
            node = nodeorrev
            rev = None

        # fast path the special `nullid` rev
        if node == nullid:
            return b"", {}

        # ``rawtext`` is the text as stored inside the revlog. Might be the
        # revision or might need to be processed to retrieve the revision.
        rev, rawtext, validated = self._rawtext(node, rev, _df=_df)

        if self.version & 0xFFFF == REVLOGV2:
            if rev is None:
                rev = self.rev(node)
            sidedata = self._sidedata(rev)
        else:
            sidedata = {}

        if raw and validated:
            # if we don't want to process the raw text and the raw
            # text is cached, we can exit early.
            return rawtext, sidedata
        if rev is None:
            rev = self.rev(node)
        # the revlog's flags for this revision
        # (they usually alter its state or content)
        flags = self.flags(rev)

        if validated and flags == REVIDX_DEFAULT_FLAGS:
            # no extra flags set, no flag processor runs, text = rawtext
            return rawtext, sidedata

        if raw:
            validatehash = flagutil.processflagsraw(self, rawtext, flags)
            text = rawtext
        else:
            r = flagutil.processflagsread(self, rawtext, flags)
            text, validatehash = r
        if validatehash:
            self.checkhash(text, node, rev=rev)
        if not validated:
            self._revisioncache = (node, rev, rawtext)

        return text, sidedata

    def _rawtext(self, node, rev, _df=None):
        """return the possibly unvalidated rawtext for a revision

        returns (rev, rawtext, validated)
        """

        # revision in the cache (could be useful to apply delta)
        cachedrev = None
        # An intermediate text to apply deltas to
        basetext = None

        # Check if we have the entry in cache
        # The cache entry looks like (node, rev, rawtext)
        if self._revisioncache:
            if self._revisioncache[0] == node:
                return (rev, self._revisioncache[2], True)
            cachedrev = self._revisioncache[1]

        if rev is None:
            rev = self.rev(node)

        chain, stopped = self._deltachain(rev, stoprev=cachedrev)
        if stopped:
            basetext = self._revisioncache[2]

        # drop cache to save memory, the caller is expected to
        # update self._revisioncache after validating the text
        self._revisioncache = None

        targetsize = None
        rawsize = self.index[rev][2]
        if 0 <= rawsize:
            targetsize = 4 * rawsize

        bins = self._chunks(chain, df=_df, targetsize=targetsize)
        if basetext is None:
            basetext = bytes(bins[0])
            bins = bins[1:]

        rawtext = mdiff.patches(basetext, bins)
        del basetext  # let us have a chance to free memory early
        return (rev, rawtext, False)

    def _sidedata(self, rev):
        """Return the sidedata for a given revision number."""
        index_entry = self.index[rev]
        sidedata_offset = index_entry[8]
        sidedata_size = index_entry[9]

        if self._inline:
            sidedata_offset += self.index.entry_size * (1 + rev)
        if sidedata_size == 0:
            return {}

        segment = self._getsegment(sidedata_offset, sidedata_size)
        sidedata = sidedatautil.deserialize_sidedata(segment)
        return sidedata

    def rawdata(self, nodeorrev, _df=None):
        """return the uncompressed raw data of a given node or revision number.

        _df - an existing file handle to read from. (internal-only)
        """
        return self._revisiondata(nodeorrev, _df, raw=True)[0]

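    # Illustrative sketch (editorial): revision() and rawdata() differ only
    # in whether flag processors transform the stored text. For a rev with no
    # special flags set, both return the same bytes; `rl` is an assumed open
    # revlog:
    #
    #     if rl.flags(rev) == REVIDX_DEFAULT_FLAGS:
    #         assert rl.revision(rev) == rl.rawdata(rev)
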
    def hash(self, text, p1, p2):
        """Compute a node hash.

        Available as a function so that subclasses can replace the hash
        as needed.
        """
        return storageutil.hashrevisionsha1(text, p1, p2)

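    # Illustrative sketch (editorial): for the default SHA-1 scheme the node
    # is, roughly, the hash of the revision text prefixed by the two parent
    # nodes in sorted order; a hypothetical standalone equivalent would be:
    #
    #     import hashlib
    #     def _example_hash(text, p1, p2):
    #         a, b = sorted([p1, p2])
    #         return hashlib.sha1(a + b + text).digest()
    #
    # storageutil.hashrevisionsha1() implements this (with fast paths for
    # null parents), which is why changing a parent changes the node.
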
    def checkhash(self, text, node, p1=None, p2=None, rev=None):
        """Check node hash integrity.

        Available as a function so that subclasses can extend hash mismatch
        behaviors as needed.
        """
        try:
            if p1 is None and p2 is None:
                p1, p2 = self.parents(node)
            if node != self.hash(text, p1, p2):
                # Clear the revision cache on hash failure. The revision cache
                # only stores the raw revision and clearing the cache does have
                # the side-effect that we won't have a cache hit when the raw
                # revision data is accessed. But this case should be rare and
                # it is extra work to teach the cache about the hash
                # verification state.
                if self._revisioncache and self._revisioncache[0] == node:
                    self._revisioncache = None

                revornode = rev
                if revornode is None:
                    revornode = templatefilters.short(hex(node))
                raise error.RevlogError(
                    _(b"integrity check failed on %s:%s")
                    % (self.indexfile, pycompat.bytestr(revornode))
                )
        except error.RevlogError:
            if self._censorable and storageutil.iscensoredtext(text):
                raise error.CensoredNodeError(self.indexfile, node, text)
            raise

    def _enforceinlinesize(self, tr, fp=None):
        """Check if the revlog is too big for inline and convert if so.

        This should be called after revisions are added to the revlog. If the
        revlog has grown too large to be an inline revlog, it will convert it
        to use multiple index and data files.
        """
        tiprev = len(self) - 1
        if (
            not self._inline
            or (self.start(tiprev) + self.length(tiprev)) < _maxinline
        ):
            return

        troffset = tr.findoffset(self.indexfile)
        if troffset is None:
            raise error.RevlogError(
                _(b"%s not found in the transaction") % self.indexfile
            )
        trindex = 0
        tr.add(self.datafile, 0)

        if fp:
            fp.flush()
            fp.close()
            # We can't use the cached file handle after close(). So prevent
            # its usage.
            self._writinghandles = None

        with self._indexfp(b'r') as ifh, self._datafp(b'w') as dfh:
            for r in self:
                dfh.write(self._getsegmentforrevs(r, r, df=ifh)[1])
                if troffset <= self.start(r):
                    trindex = r

        with self._indexfp(b'w') as fp:
            self.version &= ~FLAG_INLINE_DATA
            self._inline = False
            io = self._io
            for i in self:
                e = io.packentry(self.index[i], self.node, self.version, i)
                fp.write(e)

            # the temp file replaces the real index when we exit the context
            # manager

        tr.replace(self.indexfile, trindex * self.index.entry_size)
        nodemaputil.setup_persistent_nodemap(tr, self)
        self._chunkclear()

    def _nodeduplicatecallback(self, transaction, node):
        """called when trying to add a node already stored."""

    def addrevision(
        self,
        text,
        transaction,
        link,
        p1,
        p2,
        cachedelta=None,
        node=None,
        flags=REVIDX_DEFAULT_FLAGS,
        deltacomputer=None,
        sidedata=None,
    ):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        cachedelta - an optional precomputed delta
        node - nodeid of revision; typically node is not specified, and it is
        computed by default as hash(text, p1, p2), however subclasses might
        use a different hashing method (and override checkhash() in such case)
        flags - the known flags to set on the revision
        deltacomputer - an optional deltacomputer instance shared between
        multiple calls
        """
        if link == nullrev:
            raise error.RevlogError(
                _(b"attempted to add linkrev -1 to %s") % self.indexfile
            )

        if sidedata is None:
            sidedata = {}
        elif not self.hassidedata:
            raise error.ProgrammingError(
                _(b"trying to add sidedata to a revlog that does not support them")
            )

        if flags:
            node = node or self.hash(text, p1, p2)

        rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

        # If the flag processor modifies the revision data, ignore any provided
        # cachedelta.
        if rawtext != text:
            cachedelta = None

        if len(rawtext) > _maxentrysize:
            raise error.RevlogError(
                _(
                    b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                )
                % (self.indexfile, len(rawtext))
            )

        node = node or self.hash(rawtext, p1, p2)
        rev = self.index.get_rev(node)
        if rev is not None:
            return rev

        if validatehash:
            self.checkhash(rawtext, node, p1=p1, p2=p2)

        return self.addrawrevision(
            rawtext,
            transaction,
            link,
            p1,
            p2,
            node,
            flags,
            cachedelta=cachedelta,
            deltacomputer=deltacomputer,
            sidedata=sidedata,
        )

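    # Illustrative usage sketch (editorial, hypothetical names): adding a
    # text revision within a transaction; `rl`, `tr`, `linkrev`, `p1node` and
    # `p2node` are assumed to come from the caller:
    #
    #     rev = rl.addrevision(b'file content\n', tr, linkrev, p1node, p2node)
    #
    # addrevision() returns the existing rev number when the computed node is
    # already present, so callers may treat it as idempotent per content.
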
    def addrawrevision(
        self,
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=None,
        deltacomputer=None,
        sidedata=None,
    ):
        """add a raw revision with known flags, node and parents
        useful when reusing a revision not stored in this revlog (ex: received
        over wire, or read from an external bundle).
        """
        dfh = None
        if not self._inline:
            dfh = self._datafp(b"a+")
        ifh = self._indexfp(b"a+")
        try:
            return self._addrevision(
                node,
                rawtext,
                transaction,
                link,
                p1,
                p2,
                flags,
                cachedelta,
                ifh,
                dfh,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )
        finally:
            if dfh:
                dfh.close()
            ifh.close()

    def compress(self, data):
        """Generate a possibly-compressed representation of data."""
        if not data:
            return b'', data

        compressed = self._compressor.compress(data)

        if compressed:
            # The revlog compressor added the header in the returned data.
            return b'', compressed

        if data[0:1] == b'\0':
            return b'', data
        return b'u', data

    def decompress(self, data):
        """Decompress a revlog chunk.

        The chunk is expected to begin with a header identifying the
        format type so it can be routed to an appropriate decompressor.
        """
        if not data:
            return data

        # Revlogs are read much more frequently than they are written and many
        # chunks only take microseconds to decompress, so performance is
        # important here.
        #
        # We can make a few assumptions about revlogs:
        #
        # 1) the majority of chunks will be compressed (as opposed to inline
        #    raw data).
        # 2) decompressing *any* data will likely be at least 10x slower than
        #    returning raw inline data.
        # 3) we want to prioritize common and officially supported compression
        #    engines
        #
        # It follows that we want to optimize for "decompress compressed data
        # when encoded with common and officially supported compression engines"
        # case over "raw data" and "data encoded by less common or non-official
        # compression engines." That is why we have the inline lookup first
        # followed by the compengines lookup.
        #
        # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
        # compressed chunks. And this matters for changelog and manifest reads.
        t = data[0:1]

        if t == b'x':
            try:
                return _zlibdecompress(data)
            except zlib.error as e:
                raise error.RevlogError(
                    _(b'revlog decompress error: %s')
                    % stringutil.forcebytestr(e)
                )
        # '\0' is more common than 'u' so it goes first.
        elif t == b'\0':
            return data
        elif t == b'u':
            return util.buffer(data, 1)

        try:
            compressor = self._decompressors[t]
        except KeyError:
            try:
                engine = util.compengines.forrevlogheader(t)
                compressor = engine.revlogcompressor(self._compengineopts)
                self._decompressors[t] = compressor
            except KeyError:
                raise error.RevlogError(
                    _(b'unknown compression type %s') % binascii.hexlify(t)
                )

        return compressor.decompress(data)

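    # Illustrative sketch (editorial): compress() returns a (header, data)
    # pair whose concatenation is what gets stored and what decompress()
    # expects back, so for an assumed open revlog `rl` the round-trip is:
    #
    #     header, packed = rl.compress(chunk)
    #     assert bytes(rl.decompress(header + packed)) == chunk
    #
    # (bytes() because the b'u' path returns a util.buffer view, not bytes.)
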
    def _addrevision(
        self,
        node,
        rawtext,
        transaction,
        link,
        p1,
        p2,
        flags,
        cachedelta,
        ifh,
        dfh,
        alwayscache=False,
        deltacomputer=None,
        sidedata=None,
    ):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.

        note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

        if "deltacomputer" is not provided or None, a defaultdeltacomputer will
        be used.

        invariants:
        - rawtext is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        if node == nullid:
            raise error.RevlogError(
                _(b"%s: attempt to add null revision") % self.indexfile
            )
        if node == wdirid or node in wdirfilenodeids:
            raise error.RevlogError(
                _(b"%s: attempt to add wdir revision") % self.indexfile
            )

        if self._inline:
            fh = ifh
        else:
            fh = dfh

        btext = [rawtext]

        curr = len(self)
        prev = curr - 1

        offset = self._get_data_offset(prev)

        if self._concurrencychecker:
            if self._inline:
                # offset is "as if" it were in the .d file, so we need to add on
                # the size of the entry metadata.
                self._concurrencychecker(
                    ifh, self.indexfile, offset + curr * self.index.entry_size
                )
            else:
                # Entries in the .i are a consistent size.
                self._concurrencychecker(
                    ifh, self.indexfile, curr * self.index.entry_size
                )
                self._concurrencychecker(dfh, self.datafile, offset)

        p1r, p2r = self.rev(p1), self.rev(p2)

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if rawtext is None:
            # need rawtext size, before changed by flag processors, which is
            # the non-raw size. use revlog explicitly to avoid filelog's extra
            # logic that might remove metadata size.
            textlen = mdiff.patchedsize(
                revlog.size(self, cachedelta[0]), cachedelta[1]
            )
        else:
            textlen = len(rawtext)

        if deltacomputer is None:
            deltacomputer = deltautil.deltacomputer(self)

        revinfo = _revisioninfo(node, p1, p2, btext, textlen, cachedelta, flags)

        deltainfo = deltacomputer.finddeltainfo(revinfo, fh)

        if sidedata:
            serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
            sidedata_offset = offset + deltainfo.deltalen
        else:
            serialized_sidedata = b""
            # Don't store the offset if the sidedata is empty, that way
            # we can easily detect empty sidedata and they will be no different
            # than ones we manually add.
            sidedata_offset = 0

        e = (
            offset_type(offset, flags),
            deltainfo.deltalen,
            textlen,
            deltainfo.base,
            link,
            p1r,
            p2r,
            node,
            sidedata_offset,
            len(serialized_sidedata),
        )

        if self.version & 0xFFFF != REVLOGV2:
            e = e[:8]

        self.index.append(e)
        entry = self._io.packentry(e, self.node, self.version, curr)
        self._writeentry(
            transaction,
            ifh,
            dfh,
            entry,
            deltainfo.data,
            link,
            offset,
            serialized_sidedata,
        )

        rawtext = btext[0]

        if alwayscache and rawtext is None:
            rawtext = deltacomputer.buildtext(revinfo, fh)

        if type(rawtext) == bytes:  # only accept immutable objects
            self._revisioncache = (node, curr, rawtext)
        self._chainbasecache[curr] = deltainfo.chainbase
        return curr

    def _get_data_offset(self, prev):
        """Returns the current offset in the (in-transaction) data file.
        Versions < 2 of the revlog can get this in O(1), revlog v2 needs a
        docket file to store that information: since sidedata can be rewritten
        to the end of the data file within a transaction, you can have cases
        where, for example, rev `n` does not have sidedata while rev `n - 1`
        does, leading to `n - 1`'s sidedata being written after `n`'s data.

        TODO cache this in a docket file before getting out of experimental."""
        if self.version & 0xFFFF != REVLOGV2:
            return self.end(prev)

        offset = 0
        for rev, entry in enumerate(self.index):
            sidedata_end = entry[8] + entry[9]
            # Sidedata for a previous rev has potentially been written after
            # this rev's end, so take the max.
            offset = max(self.end(rev), offset, sidedata_end)
        return offset

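    # Illustrative sketch (editorial): in a revlog-v2 transaction the data
    # file can interleave sidedata behind later revisions, so the next write
    # offset is the max over both kinds of ends. With hypothetical entries:
    #
    #     rev 0: data [0, 100),   sidedata [180, 200)
    #     rev 1: data [100, 180), sidedata empty
    #
    # self.end(1) is 180 but rev 0's sidedata ends at 200, so
    # _get_data_offset() returns 200.
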
    def _writeentry(
        self, transaction, ifh, dfh, entry, data, link, offset, sidedata
    ):
        # Files opened in a+ mode have inconsistent behavior on various
        # platforms. Windows requires that a file positioning call be made
        # when the file handle transitions between reads and writes. See
        # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
        # platforms, Python or the platform itself can be buggy. Some versions
        # of Solaris have been observed to not append at the end of the file
        # if the file was seeked to before the end. See issue4943 for more.
        #
        # We work around this issue by inserting a seek() before writing.
        # Note: This is likely not necessary on Python 3. However, because
        # the file handle is reused for reads and may be seeked there, we need
        # to be careful before changing this.
        ifh.seek(0, os.SEEK_END)
        if dfh:
            dfh.seek(0, os.SEEK_END)

        curr = len(self) - 1
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            if sidedata:
                dfh.write(sidedata)
            ifh.write(entry)
        else:
            offset += curr * self.index.entry_size
            transaction.add(self.indexfile, offset)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            if sidedata:
                ifh.write(sidedata)
            self._enforceinlinesize(transaction, ifh)
        nodemaputil.setup_persistent_nodemap(transaction, self)

    def addgroup(
        self,
        deltas,
        linkmapper,
        transaction,
        alwayscache=False,
        addrevisioncb=None,
        duplicaterevisioncb=None,
    ):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.

        If ``addrevisioncb`` is defined, it will be called with arguments of
        this revlog and the rev that was added.
        """

        if self._writinghandles:
            raise error.ProgrammingError(b'cannot nest addgroup() calls')

        r = len(self)
        end = 0
        if r:
            end = self.end(r - 1)
        ifh = self._indexfp(b"a+")
        isize = r * self.index.entry_size
        if self._inline:
            transaction.add(self.indexfile, end + isize)
            dfh = None
        else:
            transaction.add(self.indexfile, isize)
            transaction.add(self.datafile, end)
            dfh = self._datafp(b"a+")

        def flush():
            if dfh:
                dfh.flush()
            ifh.flush()

        self._writinghandles = (ifh, dfh)
        empty = True

        try:
            deltacomputer = deltautil.deltacomputer(self)
            # loop through our set of deltas
            for data in deltas:
                node, p1, p2, linknode, deltabase, delta, flags, sidedata = data
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                rev = self.index.get_rev(node)
                if rev is not None:
                    # this can happen if two branches make the same change
                    self._nodeduplicatecallback(transaction, rev)
                    if duplicaterevisioncb:
                        duplicaterevisioncb(self, rev)
                    empty = False
                    continue

                for p in (p1, p2):
                    if not self.index.has_node(p):
                        raise error.LookupError(
                            p, self.indexfile, _(b'unknown parent')
                        )

                if not self.index.has_node(deltabase):
                    raise error.LookupError(
                        deltabase, self.indexfile, _(b'unknown delta base')
                    )

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # if base is censored, delta must be full replacement in a
                    # single patch operation
                    hlen = struct.calcsize(b">lll")
                    oldlen = self.rawsize(baserev)
                    newlen = len(delta) - hlen
                    if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
                        raise error.CensoredBaseError(
                            self.indexfile, self.node(baserev)
                        )

                if not flags and self._peek_iscensored(baserev, delta, flush):
                    flags |= REVIDX_ISCENSORED

                # We assume consumers of addrevisioncb will want to retrieve
                # the added revision, which will require a call to
                # revision(). revision() will fast path if there is a cache
                # hit. So, we tell _addrevision() to always cache in this case.
                # We're only using addgroup() in the context of changegroup
                # generation so the revision data can always be handled as raw
                # by the flagprocessor.
                rev = self._addrevision(
                    node,
                    None,
                    transaction,
                    link,
                    p1,
                    p2,
                    flags,
                    (baserev, delta),
                    ifh,
                    dfh,
                    alwayscache=alwayscache,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

                if addrevisioncb:
                    addrevisioncb(self, rev)
                empty = False

                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    ifh.close()
                    dfh = self._datafp(b"a+")
                    ifh = self._indexfp(b"a+")
                    self._writinghandles = (ifh, dfh)
        finally:
            self._writinghandles = None

        if dfh:
            dfh.close()
        ifh.close()
        return not empty

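    # Illustrative sketch (editorial): each entry consumed from `deltas` is
    # an 8-tuple matching the unpacking in addgroup() above; a hypothetical
    # generator feeding it would yield entries shaped like:
    #
    #     (node, p1, p2, linknode, deltabase, delta, flags, sidedata)
    #
    # where `delta` is a binary patch against the raw text of `deltabase` and
    # `flags` may be 0 to mean REVIDX_DEFAULT_FLAGS.
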
    def iscensored(self, rev):
        """Check if a file revision is censored."""
        if not self._censorable:
            return False

        return self.flags(rev) & REVIDX_ISCENSORED

    def _peek_iscensored(self, baserev, delta, flush):
        """Quickly check if a delta produces a censored revision."""
        if not self._censorable:
            return False

        return storageutil.deltaiscensored(delta, baserev, self.rawsize)

    def getstrippoint(self, minlink):
        """find the minimum rev that must be stripped to strip the linkrev

        Returns a tuple containing the minimum rev and a set of all revs that
        have linkrevs that will be broken by this strip.
        """
        return storageutil.resolvestripinfo(
            minlink,
            len(self) - 1,
            self.headrevs(),
            self.linkrev,
            self.parentrevs,
        )

    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        rev, _ = self.getstrippoint(minlink)
        if rev == len(self):
            return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            transaction.add(self.datafile, end)
            end = rev * self.index.entry_size
        else:
            end += rev * self.index.entry_size

        transaction.add(self.indexfile, end)

        # then reset internal state in memory to forget those revisions
        self._revisioncache = None
        self._chaininfocache = util.lrucachedict(500)
        self._chunkclear()

        del self.index[rev:-1]

    def checksize(self):
        """Check size of index and data files

        return a (dd, di) tuple.
        - dd: extra bytes for the "data" file
        - di: extra bytes for the "index" file

        A healthy revlog will return (0, 0).
        """
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            with self._datafp() as f:
                f.seek(0, io.SEEK_END)
                actual = f.tell()
            dd = actual - expected
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, io.SEEK_END)
            actual = f.tell()
            f.close()
            s = self.index.entry_size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)

    def files(self):
        res = [self.indexfile]
        if not self._inline:
            res.append(self.datafile)
        return res

    def emitrevisions(
        self,
        nodes,
        nodesorder=None,
        revisiondata=False,
        assumehaveparentrevisions=False,
        deltamode=repository.CG_DELTAMODE_STD,
        sidedata_helpers=None,
    ):
        if nodesorder not in (b'nodes', b'storage', b'linear', None):
            raise error.ProgrammingError(
                b'unhandled value for nodesorder: %s' % nodesorder
            )

        if nodesorder is None and not self._generaldelta:
            nodesorder = b'storage'

        if (
            not self._storedeltachains
            and deltamode != repository.CG_DELTAMODE_PREV
        ):
            deltamode = repository.CG_DELTAMODE_FULL

        return storageutil.emitrevisions(
            self,
            nodes,
            nodesorder,
            revlogrevisiondelta,
            deltaparentfn=self.deltaparent,
            candeltafn=self.candelta,
            rawsizefn=self.rawsize,
            revdifffn=self.revdiff,
            flagsfn=self.flags,
            deltamode=deltamode,
            revisiondata=revisiondata,
            assumehaveparentrevisions=assumehaveparentrevisions,
            sidedata_helpers=sidedata_helpers,
        )

    DELTAREUSEALWAYS = b'always'
    DELTAREUSESAMEREVS = b'samerevs'
    DELTAREUSENEVER = b'never'

    DELTAREUSEFULLADD = b'fulladd'

    DELTAREUSEALL = {b'always', b'samerevs', b'never', b'fulladd'}

    def clone(
        self,
        tr,
        destrevlog,
        addrevisioncb=None,
        deltareuse=DELTAREUSESAMEREVS,
        forcedeltabothparents=None,
        sidedatacompanion=None,
    ):
        """Copy this revlog to another, possibly with format changes.

        The destination revlog will contain the same revisions and nodes.
        However, it may not be bit-for-bit identical due to e.g. delta
        encoding differences.

        The ``deltareuse`` argument controls how deltas from the existing
        revlog are preserved in the destination revlog. The argument can have
        the following values:

        DELTAREUSEALWAYS
          Deltas will always be reused (if possible), even if the destination
          revlog would not select the same revisions for the delta. This is
          the fastest mode of operation.
        DELTAREUSESAMEREVS
          Deltas will be reused if the destination revlog would pick the same
          revisions for the delta. This mode strikes a balance between speed
          and optimization.
        DELTAREUSENEVER
          Deltas will never be reused. This is the slowest mode of execution.
          This mode can be used to recompute deltas (e.g. if the diff/delta
          algorithm changes).
        DELTAREUSEFULLADD
          Revisions will be re-added as if they were new content. This is
          slower than DELTAREUSEALWAYS but allows more mechanisms to kick in,
          e.g. large file detection and handling.

        Delta computation can be slow, so the choice of delta reuse policy
        can significantly affect run time.

        The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
        two extremes. Deltas will be reused if they are appropriate. But if
        the delta could choose a better revision, it will do so. This means
        if you are converting a non-generaldelta revlog to a generaldelta
        revlog, deltas will be recomputed if the delta's parent isn't a
        parent of the revision.

        In addition to the delta policy, the ``forcedeltabothparents``
        argument controls whether to force computing deltas against both
        parents for merges. When None, the destination revlog's current
        setting is kept.

        If not None, `sidedatacompanion` is a callable that accepts two
        arguments:

            (srcrevlog, rev)

        and returns a quintet that controls changes to sidedata content from
        the old revision to the new clone result:

            (dropall, filterout, update, new_flags, dropped_flags)

        * if `dropall` is True, all sidedata should be dropped
        * `filterout` is a set of sidedata keys that should be dropped
        * `update` is a mapping of additional/new key -> value
        * `new_flags` is a bitfield of new flags that the revision should get
        * `dropped_flags` is a bitfield of flags that the revision should no
          longer have
        """
        if deltareuse not in self.DELTAREUSEALL:
            raise ValueError(
                _(b'value for deltareuse invalid: %s') % deltareuse
            )

        if len(destrevlog):
            raise ValueError(_(b'destination revlog is not empty'))

        if getattr(self, 'filteredrevs', None):
            raise ValueError(_(b'source revlog has filtered revisions'))
        if getattr(destrevlog, 'filteredrevs', None):
            raise ValueError(_(b'destination revlog has filtered revisions'))

        # lazydelta and lazydeltabase control whether to reuse a cached delta,
        # if possible.
        oldlazydelta = destrevlog._lazydelta
        oldlazydeltabase = destrevlog._lazydeltabase
        oldamd = destrevlog._deltabothparents

        try:
            if deltareuse == self.DELTAREUSEALWAYS:
                destrevlog._lazydeltabase = True
                destrevlog._lazydelta = True
            elif deltareuse == self.DELTAREUSESAMEREVS:
                destrevlog._lazydeltabase = False
                destrevlog._lazydelta = True
            elif deltareuse == self.DELTAREUSENEVER:
                destrevlog._lazydeltabase = False
                destrevlog._lazydelta = False

            destrevlog._deltabothparents = forcedeltabothparents or oldamd

            self._clone(
                tr,
                destrevlog,
                addrevisioncb,
                deltareuse,
                forcedeltabothparents,
                sidedatacompanion,
            )

        finally:
            destrevlog._lazydelta = oldlazydelta
            destrevlog._lazydeltabase = oldlazydeltabase
            destrevlog._deltabothparents = oldamd

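    # Editor's sketch (not part of the original file; the names `src`, `dst`
    # and `tr` are assumed to be a source revlog, an empty destination revlog
    # and an open transaction). Recomputing every delta while copying:
    #
    #     src.clone(tr, dst, deltareuse=src.DELTAREUSENEVER)
    #
    # A `sidedatacompanion` that drops all sidedata from every revision could
    # look like:
    #
    #     def drop_all_sidedata(srcrevlog, rev):
    #         return (True, set(), {}, 0, 0)
    #
    #     src.clone(tr, dst, sidedatacompanion=drop_all_sidedata)
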
    def _clone(
        self,
        tr,
        destrevlog,
        addrevisioncb,
        deltareuse,
        forcedeltabothparents,
        sidedatacompanion,
    ):
        """perform the core duty of `revlog.clone` after parameter processing"""
        deltacomputer = deltautil.deltacomputer(destrevlog)
        index = self.index
        for rev in self:
            entry = index[rev]

            # Some classes override linkrev to take filtered revs into
            # account. Use raw entry from index.
            flags = entry[0] & 0xFFFF
            linkrev = entry[4]
            p1 = index[entry[5]][7]
            p2 = index[entry[6]][7]
            node = entry[7]
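            # Editor's note: the raw index entry is a tuple where entry[0]
            # packs the data offset with the flags in the low 16 bits,
            # entry[4] is the linkrev, entry[5]/entry[6] are the parent
            # revisions and entry[7] is the binary node; revlogv2 entries
            # additionally carry entry[8]/entry[9], the sidedata offset and
            # size used by rewrite_sidedata() below.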

            sidedataactions = (False, [], {}, 0, 0)
            if sidedatacompanion is not None:
                sidedataactions = sidedatacompanion(self, rev)

            # (Possibly) reuse the delta from the revlog if allowed and
            # the revlog chunk is a delta.
            cachedelta = None
            rawtext = None
            if any(sidedataactions) or deltareuse == self.DELTAREUSEFULLADD:
                dropall = sidedataactions[0]
                filterout = sidedataactions[1]
                update = sidedataactions[2]
                new_flags = sidedataactions[3]
                dropped_flags = sidedataactions[4]
                text, sidedata = self._revisiondata(rev)
                if dropall:
                    sidedata = {}
                for key in filterout:
                    sidedata.pop(key, None)
                sidedata.update(update)
                if not sidedata:
                    sidedata = None

                flags |= new_flags
                flags &= ~dropped_flags

                destrevlog.addrevision(
                    text,
                    tr,
                    linkrev,
                    p1,
                    p2,
                    cachedelta=cachedelta,
                    node=node,
                    flags=flags,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )
            else:
                if destrevlog._lazydelta:
                    dp = self.deltaparent(rev)
                    if dp != nullrev:
                        cachedelta = (dp, bytes(self._chunk(rev)))

                if not cachedelta:
                    rawtext = self.rawdata(rev)

                ifh = destrevlog.opener(
                    destrevlog.indexfile, b'a+', checkambig=False
                )
                dfh = None
                if not destrevlog._inline:
                    dfh = destrevlog.opener(destrevlog.datafile, b'a+')
                try:
                    destrevlog._addrevision(
                        node,
                        rawtext,
                        tr,
                        linkrev,
                        p1,
                        p2,
                        flags,
                        cachedelta,
                        ifh,
                        dfh,
                        deltacomputer=deltacomputer,
                    )
                finally:
                    if dfh:
                        dfh.close()
                    ifh.close()

            if addrevisioncb:
                addrevisioncb(self, rev, node)

    def censorrevision(self, tr, censornode, tombstone=b''):
        if (self.version & 0xFFFF) == REVLOGV0:
            raise error.RevlogError(
                _(b'cannot censor with version %d revlogs') % self.version
            )

        censorrev = self.rev(censornode)
        tombstone = storageutil.packmeta({b'censored': tombstone}, b'')

        if len(tombstone) > self.rawsize(censorrev):
            raise error.Abort(
                _(b'censor tombstone must be no longer than censored data')
            )

        # Rewriting the revlog in place is hard. Our strategy for censoring is
        # to create a new revlog, copy all revisions to it, then replace the
        # revlogs on transaction close.

        newindexfile = self.indexfile + b'.tmpcensored'
        newdatafile = self.datafile + b'.tmpcensored'

        # This is a bit dangerous. We could easily have a mismatch of state.
        newrl = revlog(self.opener, newindexfile, newdatafile, censorable=True)
        newrl.version = self.version
        newrl._generaldelta = self._generaldelta
        newrl._io = self._io

        for rev in self.revs():
            node = self.node(rev)
            p1, p2 = self.parents(node)

            if rev == censorrev:
                newrl.addrawrevision(
                    tombstone,
                    tr,
                    self.linkrev(censorrev),
                    p1,
                    p2,
                    censornode,
                    REVIDX_ISCENSORED,
                )

                if newrl.deltaparent(rev) != nullrev:
                    raise error.Abort(
                        _(
                            b'censored revision stored as delta; '
                            b'cannot censor'
                        ),
                        hint=_(
                            b'censoring of revlogs is not '
                            b'fully implemented; please report '
                            b'this bug'
                        ),
                    )
                continue

            if self.iscensored(rev):
                if self.deltaparent(rev) != nullrev:
                    raise error.Abort(
                        _(
                            b'cannot censor due to censored '
                            b'revision having delta stored'
                        )
                    )
                rawtext = self._chunk(rev)
            else:
                rawtext = self.rawdata(rev)

            newrl.addrawrevision(
                rawtext, tr, self.linkrev(rev), p1, p2, node, self.flags(rev)
            )

        tr.addbackup(self.indexfile, location=b'store')
        if not self._inline:
            tr.addbackup(self.datafile, location=b'store')

        self.opener.rename(newrl.indexfile, self.indexfile)
        if not self._inline:
            self.opener.rename(newrl.datafile, self.datafile)

        self.clearcaches()
        self._loadindex()

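    # Editor's sketch (assumed names, not part of the original file): with
    # `rl` a revlog created with censorable=True and `tr` an open
    # transaction, replacing one revision's content looks like:
    #
    #     rl.censorrevision(tr, censornode, tombstone=b'removed by request')
    #
    # The packed tombstone must be no longer than the censored revision's
    # rawsize, and the censored revision must end up stored as a full
    # snapshot rather than a delta.
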
    def verifyintegrity(self, state):
        """Verifies the integrity of the revlog.

        Yields ``revlogproblem`` instances describing problems that are
        found.
        """
        dd, di = self.checksize()
        if dd:
            yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
        if di:
            yield revlogproblem(error=_(b'index contains %d extra bytes') % di)

        version = self.version & 0xFFFF

        # The verifier tells us what version revlog we should be.
        if version != state[b'expectedversion']:
            yield revlogproblem(
                warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                % (self.indexfile, version, state[b'expectedversion'])
            )

        state[b'skipread'] = set()
        state[b'safe_renamed'] = set()

        for rev in self:
            node = self.node(rev)

            # Verify contents. 4 cases to care about:
            #
            #   common: the most common case
            #   rename: with a rename
            #   meta: file content starts with b'\1\n', the metadata
            #         header defined in filelog.py, but without a rename
            #   ext: content stored externally
            #
            # More formally, their differences are shown below:
            #
            #                       | common | rename | meta  | ext
            #  -------------------------------------------------------
            #  flags()              | 0      | 0      | 0     | not 0
            #  renamed()            | False  | True   | False | ?
            #  rawtext[0:2]=='\1\n' | False  | True   | True  | ?
            #
            # "rawtext" means the raw text stored in revlog data, which
            # could be retrieved by "rawdata(rev)". "text" mentioned below
            # is "revision(rev)".
            #
            # There are 3 different lengths stored physically:
            #  1. L1: rawsize, stored in revlog index
            #  2. L2: len(rawtext), stored in revlog data
            #  3. L3: len(text), stored in revlog data if flags==0, or
            #     possibly somewhere else if flags!=0
            #
            # L1 should be equal to L2. L3 could be different from them.
            # "text" may or may not affect commit hash depending on flag
            # processors (see flagutil.addflagprocessor).
            #
            #              | common | rename | meta  | ext
            # -------------------------------------------------
            # rawsize()    | L1     | L1     | L1    | L1
            # size()       | L1     | L2-LM  | L1(*) | L1 (?)
            # len(rawtext) | L2     | L2     | L2    | L2
            # len(text)    | L2     | L2     | L2    | L3
            # len(read())  | L2     | L2-LM  | L2-LM | L3 (?)
            #
            # LM:  length of metadata, depending on rawtext
            # (*): not ideal, see comment in filelog.size
            # (?): could be "- len(meta)" if the resolved content has
            #      rename metadata
            #
            # Checks needed to be done:
            #  1. length check: L1 == L2, in all cases.
            #  2. hash check: depending on flag processor, we may need to
            #     use either "text" (external), or "rawtext" (in revlog).
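            # Worked example (editor's note): for a renamed file the stored
            # rawtext is b'\x01\ncopy: a.txt\ncopyrev: <40 hex digits>\n\x01\n'
            # followed by the real text, so len(rawtext) == LM + len(text),
            # and read() strips that header again: len(read()) == L2 - LM.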

            try:
                skipflags = state.get(b'skipflags', 0)
                if skipflags:
                    skipflags &= self.flags(rev)

                _verify_revision(self, skipflags, state, node)

                l1 = self.rawsize(rev)
                l2 = len(self.rawdata(node))

                if l1 != l2:
                    yield revlogproblem(
                        error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                        node=node,
                    )

            except error.CensoredNodeError:
                if state[b'erroroncensored']:
                    yield revlogproblem(
                        error=_(b'censored file data'), node=node
                    )
                state[b'skipread'].add(node)
            except Exception as e:
                yield revlogproblem(
                    error=_(b'unpacking %s: %s')
                    % (short(node), stringutil.forcebytestr(e)),
                    node=node,
                )
                state[b'skipread'].add(node)

    def storageinfo(
        self,
        exclusivefiles=False,
        sharedfiles=False,
        revisionscount=False,
        trackedsize=False,
        storedsize=False,
    ):
        d = {}

        if exclusivefiles:
            d[b'exclusivefiles'] = [(self.opener, self.indexfile)]
            if not self._inline:
                d[b'exclusivefiles'].append((self.opener, self.datafile))

        if sharedfiles:
            d[b'sharedfiles'] = []

        if revisionscount:
            d[b'revisionscount'] = len(self)

        if trackedsize:
            d[b'trackedsize'] = sum(map(self.rawsize, iter(self)))

        if storedsize:
            d[b'storedsize'] = sum(
                self.opener.stat(path).st_size for path in self.files()
            )

        return d

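    # Editor's note: only the requested keys appear in the returned dict.
    # For instance, storageinfo(revisionscount=True, trackedsize=True) on a
    # three-revision revlog might return something like
    # {b'revisionscount': 3, b'trackedsize': 2048} (values illustrative).
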
    def rewrite_sidedata(self, helpers, startrev, endrev):
        if self.version & 0xFFFF != REVLOGV2:
            return
        # inline revlogs are not yet supported because they suffer from an
        # issue when rewriting them (since it's not an append-only
        # operation). See issue6485.
        assert not self._inline
        if not helpers[1] and not helpers[2]:
            # Nothing to generate or remove
            return

        new_entries = []
        # append the new sidedata
        with self._datafp(b'a+') as fp:
            # Maybe this bug still exists, see revlog._writeentry
            fp.seek(0, os.SEEK_END)
            current_offset = fp.tell()
            for rev in range(startrev, endrev + 1):
                entry = self.index[rev]
                new_sidedata = storageutil.run_sidedata_helpers(
                    store=self,
                    sidedata_helpers=helpers,
                    sidedata={},
                    rev=rev,
                )

                serialized_sidedata = sidedatautil.serialize_sidedata(
                    new_sidedata
                )
                if entry[8] != 0 or entry[9] != 0:
                    # rewriting entries that already have sidedata is not
                    # supported yet, because it introduces garbage data in
                    # the revlog.
                    msg = b"Rewriting existing sidedata is not supported yet"
                    raise error.Abort(msg)
                entry = entry[:8]
                entry += (current_offset, len(serialized_sidedata))

                fp.write(serialized_sidedata)
                new_entries.append(entry)
                current_offset += len(serialized_sidedata)

        # rewrite the new index entries
        with self._indexfp(b'w+') as fp:
            fp.seek(startrev * self.index.entry_size)
            for i, entry in enumerate(new_entries):
                rev = startrev + i
                self.index.replace_sidedata_info(rev, entry[8], entry[9])
                packed = self._io.packentry(entry, self.node, self.version, rev)
                fp.write(packed)
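
    # Editor's note: rewrite_sidedata works in two passes. It first appends
    # the serialized sidedata blobs to the data file while recording each
    # blob's offset and length, then seeks back into the index and rewrites
    # the affected entries so that entry[8]/entry[9] point at the new data.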
@@ -1,171 +1,168 b''
===============================================================
Test non-regression on the corruption associated with issue6528
===============================================================

Setup
-----

  $ hg init base-repo
  $ cd base-repo

  $ cat <<EOF > a.txt
  > 1
  > 2
  > 3
  > 4
  > 5
  > 6
  > EOF

  $ hg add a.txt
  $ hg commit -m 'c_base_c - create a.txt'

Modify a.txt

  $ sed -e 's/1/foo/' a.txt > a.tmp; mv a.tmp a.txt
  $ hg commit -m 'c_modify_c - modify a.txt'

Modify and rename a.txt to b.txt

  $ hg up -r "desc('c_base_c')"
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ sed -e 's/6/bar/' a.txt > a.tmp; mv a.tmp a.txt
  $ hg mv a.txt b.txt
  $ hg commit -m 'c_rename_c - rename and modify a.txt to b.txt'
  created new head

Merge each branch

  $ hg merge -r "desc('c_modify_c')"
  merging b.txt and a.txt to b.txt
  0 files updated, 1 files merged, 0 files removed, 0 files unresolved
  (branch merge, don't forget to commit)
  $ hg commit -m 'c_merge_c: commit merge'

  $ hg debugrevlogindex b.txt
  rev linkrev nodeid p1 p2
  0 2 05b806ebe5ea 000000000000 000000000000
  1 3 a58b36ad6b65 000000000000 05b806ebe5ea

Check commit Graph

  $ hg log -G
  @ changeset: 3:a1cc2bdca0aa
  |\ tag: tip
  | | parent: 2:615c6ccefd15
  | | parent: 1:373d507f4667
  | | user: test
  | | date: Thu Jan 01 00:00:00 1970 +0000
  | | summary: c_merge_c: commit merge
  | |
  | o changeset: 2:615c6ccefd15
  | | parent: 0:f5a5a568022f
  | | user: test
  | | date: Thu Jan 01 00:00:00 1970 +0000
  | | summary: c_rename_c - rename and modify a.txt to b.txt
  | |
  o | changeset: 1:373d507f4667
  |/ user: test
  | date: Thu Jan 01 00:00:00 1970 +0000
  | summary: c_modify_c - modify a.txt
  |
  o changeset: 0:f5a5a568022f
  user: test
  date: Thu Jan 01 00:00:00 1970 +0000
  summary: c_base_c - create a.txt


  $ hg cat -r . b.txt
  foo
  2
  3
  4
  5
  bar
  $ cat b.txt
  foo
  2
  3
  4
  5
  bar
  $ cd ..


Check the lack of corruption
----------------------------

  $ hg clone --pull base-repo cloned
  requesting all changes
  adding changesets
  adding manifests
  adding file changes
  added 4 changesets with 4 changes to 2 files
  new changesets f5a5a568022f:a1cc2bdca0aa
  updating to branch default
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cd cloned
  $ hg up -r "desc('c_merge_c')"
  0 files updated, 0 files merged, 0 files removed, 0 files unresolved


Status is buggy, even with debugrebuilddirstate

  $ hg cat -r . b.txt
  foo
  2
  3
  4
  5
  bar
  $ cat b.txt
  foo
  2
  3
  4
  5
  bar
  $ hg status
-  M b.txt (known-bad-output !)
  $ hg debugrebuilddirstate
  $ hg status
-  M b.txt (known-bad-output !)

the history was altered

in theory p1/p2 order does not matter, but in practice p1 == nullid is used as
a marker that some metadata is present and should be fetched.
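For example, filelog copy metadata is only consulted when p1 is nullid, so
recording the parents in the wrong order makes the rename information
invisible to readers.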

  $ hg debugrevlogindex b.txt
  rev linkrev nodeid p1 p2
  0 2 05b806ebe5ea 000000000000 000000000000
-  1 3 a58b36ad6b65 05b806ebe5ea 000000000000 (known-bad-output !)
-  1 3 a58b36ad6b65 000000000000 05b806ebe5ea (missing-correct-output !)
+  1 3 a58b36ad6b65 000000000000 05b806ebe5ea

Check commit Graph

  $ hg log -G
  @ changeset: 3:a1cc2bdca0aa
  |\ tag: tip
  | | parent: 2:615c6ccefd15
  | | parent: 1:373d507f4667
  | | user: test
  | | date: Thu Jan 01 00:00:00 1970 +0000
  | | summary: c_merge_c: commit merge
  | |
  | o changeset: 2:615c6ccefd15
  | | parent: 0:f5a5a568022f
  | | user: test
  | | date: Thu Jan 01 00:00:00 1970 +0000
  | | summary: c_rename_c - rename and modify a.txt to b.txt
  | |
  o | changeset: 1:373d507f4667
  |/ user: test
  | date: Thu Jan 01 00:00:00 1970 +0000
  | summary: c_modify_c - modify a.txt
  |
  o changeset: 0:f5a5a568022f
  user: test
  date: Thu Jan 01 00:00:00 1970 +0000
  summary: c_base_c - create a.txt

@@ -1,347 +1,347 b''
#require no-reposimplestore

  $ . "$TESTDIR/narrow-library.sh"

create full repo

  $ hg init master
  $ cd master
  $ cat >> .hg/hgrc <<EOF
  > [narrow]
  > serveellipses=True
  > EOF

  $ mkdir inside
  $ echo 1 > inside/f
  $ hg commit -Aqm 'initial inside'

  $ mkdir outside
  $ echo 1 > outside/f
  $ hg commit -Aqm 'initial outside'

  $ echo 2a > outside/f
  $ hg commit -Aqm 'outside 2a'
  $ echo 3 > inside/f
  $ hg commit -Aqm 'inside 3'
  $ echo 4a > outside/f
  $ hg commit -Aqm 'outside 4a'
  $ hg update '.~3'
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved

  $ echo 2b > outside/f
  $ hg commit -Aqm 'outside 2b'
  $ echo 3 > inside/f
  $ hg commit -Aqm 'inside 3'
  $ echo 4b > outside/f
  $ hg commit -Aqm 'outside 4b'
  $ hg update '.~3'
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved

  $ echo 2c > outside/f
  $ hg commit -Aqm 'outside 2c'
  $ echo 3 > inside/f
  $ hg commit -Aqm 'inside 3'
  $ echo 4c > outside/f
  $ hg commit -Aqm 'outside 4c'
  $ hg update '.~3'
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved

  $ echo 2d > outside/f
  $ hg commit -Aqm 'outside 2d'
  $ echo 3 > inside/f
  $ hg commit -Aqm 'inside 3'
  $ echo 4d > outside/f
  $ hg commit -Aqm 'outside 4d'

  $ hg update -r 'desc("outside 4a")'
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg merge -r 'desc("outside 4b")' 2>&1 | egrep -v '(warning:|incomplete!)'
  merging outside/f
  0 files updated, 0 files merged, 0 files removed, 1 files unresolved
  use 'hg resolve' to retry unresolved file merges or 'hg merge --abort' to abandon
  $ echo 5 > outside/f
  $ rm outside/f.orig
  $ hg resolve --mark outside/f
  (no more unresolved files)
  $ hg commit -m 'merge a/b 5'
  $ echo 6 > outside/f
  $ hg commit -Aqm 'outside 6'

  $ hg merge -r 'desc("outside 4c")' 2>&1 | egrep -v '(warning:|incomplete!)'
  merging outside/f
  0 files updated, 0 files merged, 0 files removed, 1 files unresolved
  use 'hg resolve' to retry unresolved file merges or 'hg merge --abort' to abandon
  $ echo 7 > outside/f
  $ rm outside/f.orig
  $ hg resolve --mark outside/f
  (no more unresolved files)
  $ hg commit -Aqm 'merge a/b/c 7'
  $ echo 8 > outside/f
  $ hg commit -Aqm 'outside 8'

  $ hg merge -r 'desc("outside 4d")' 2>&1 | egrep -v '(warning:|incomplete!)'
  merging outside/f
  0 files updated, 0 files merged, 0 files removed, 1 files unresolved
  use 'hg resolve' to retry unresolved file merges or 'hg merge --abort' to abandon
  $ echo 9 > outside/f
  $ rm outside/f.orig
  $ hg resolve --mark outside/f
  (no more unresolved files)
  $ hg commit -Aqm 'merge a/b/c/d 9'
  $ echo 10 > outside/f
  $ hg commit -Aqm 'outside 10'

  $ echo 11 > inside/f
  $ hg commit -Aqm 'inside 11'
  $ echo 12 > outside/f
  $ hg commit -Aqm 'outside 12'

  $ hg log -G -T '{rev} {node|short} {desc}\n'
  @ 21 8d874d57adea outside 12
  |
  o 20 7ef88b4dd4fa inside 11
  |
  o 19 2a20009de83e outside 10
  |
  o 18 3ac1f5779de3 merge a/b/c/d 9
  |\
  | o 17 38a9c2f7e546 outside 8
  | |
  | o 16 094aa62fc898 merge a/b/c 7
  | |\
  | | o 15 f29d083d32e4 outside 6
  | | |
  | | o 14 2dc11382541d merge a/b 5
  | | |\
  o | | | 13 27d07ef97221 outside 4d
  | | | |
  o | | | 12 465567bdfb2d inside 3
  | | | |
  o | | | 11 d1c61993ec83 outside 2d
  | | | |
  | o | | 10 56859a8e33b9 outside 4c
  | | | |
  | o | | 9 bb96a08b062a inside 3
  | | | |
  | o | | 8 b844052e7b3b outside 2c
  |/ / /
  | | o 7 9db2d8fcc2a6 outside 4b
  | | |
  | | o 6 6418167787a6 inside 3
  | | |
  +---o 5 77344f344d83 outside 2b
  | |
  | o 4 9cadde08dc9f outside 4a
  | |
  | o 3 019ef06f125b inside 3
  | |
  | o 2 75e40c075a19 outside 2a
  |/
  o 1 906d6c682641 initial outside
  |
  o 0 9f8e82b51004 initial inside


Now narrow and shallow clone this and get a hopefully correct graph

  $ cd ..
  $ hg clone --narrow ssh://user@dummy/master narrow --include inside --depth 7
  requesting all changes
  adding changesets
  adding manifests
  adding file changes
  added 8 changesets with 3 changes to 1 files
  new changesets *:* (glob)
  updating to branch default
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cd narrow

To make updating the tests easier, we print the emitted nodes
sorted. This makes it easier to identify when the same node structure
has been emitted, just in a different order.

  $ hg log -G -T '{rev} {node|short}{if(ellipsis,"...")} {desc}\n'
  @ 7 8d874d57adea... outside 12
  |
  o 6 7ef88b4dd4fa inside 11
  |
  o 5 2a20009de83e... outside 10
  |
  o 4 3ac1f5779de3... merge a/b/c/d 9
  |\
  | o 3 465567bdfb2d inside 3
  | |
  | o 2 d1c61993ec83... outside 2d
  |
  o 1 bb96a08b062a inside 3
  |
  o 0 b844052e7b3b... outside 2c


  $ hg log -T '{if(ellipsis,"...")}{node|short} {p1node|short} {p2node|short} {desc}\n' | sort
-  ...2a20009de83e 3ac1f5779de3 000000000000 outside 10
+  ...2a20009de83e 000000000000 3ac1f5779de3 outside 10
  ...3ac1f5779de3 bb96a08b062a 465567bdfb2d merge a/b/c/d 9
  ...8d874d57adea 7ef88b4dd4fa 000000000000 outside 12
  ...b844052e7b3b 000000000000 000000000000 outside 2c
  ...d1c61993ec83 000000000000 000000000000 outside 2d
  465567bdfb2d d1c61993ec83 000000000000 inside 3
  7ef88b4dd4fa 2a20009de83e 000000000000 inside 11
  bb96a08b062a b844052e7b3b 000000000000 inside 3

  $ cd ..

Incremental test case: show that a pull can pull in a conflicted merge even if elided

  $ hg init pullmaster
  $ cd pullmaster
  $ cat >> .hg/hgrc <<EOF
  > [narrow]
  > serveellipses=True
  > EOF
  $ mkdir inside outside
  $ echo v1 > inside/f
  $ echo v1 > outside/f
  $ hg add inside/f outside/f
  $ hg commit -m init

  $ for line in a b c d
  > do
  > hg update -r 0
  > echo v2$line > outside/f
  > hg commit -m "outside 2$line"
  > echo v2$line > inside/f
  > hg commit -m "inside 2$line"
  > echo v3$line > outside/f
  > hg commit -m "outside 3$line"
  > echo v4$line > outside/f
  > hg commit -m "outside 4$line"
  > done
  0 files updated, 0 files merged, 0 files removed, 0 files unresolved
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  created new head
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  created new head
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  created new head

  $ cd ..
  $ hg clone --narrow ssh://user@dummy/pullmaster pullshallow \
  > --include inside --depth 3
  requesting all changes
  adding changesets
  adding manifests
  adding file changes
  added 12 changesets with 5 changes to 1 files (+3 heads)
  new changesets *:* (glob)
  updating to branch default
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cd pullshallow

  $ hg log -G -T '{rev} {node|short}{if(ellipsis,"...")} {desc}\n'
  @ 11 0ebbd712a0c8... outside 4d
  |
  o 10 0d4c867aeb23 inside 2d
  |
  o 9 e932969c3961... outside 2d

  o 8 33d530345455... outside 4c
  |
  o 7 0ce6481bfe07 inside 2c
  |
  o 6 caa65c940632... outside 2c

  o 5 3df233defecc... outside 4b
  |
  o 4 7162cc6d11a4 inside 2b
  |
  o 3 f2a632f0082d... outside 2b

  o 2 b8a3da16ba49... outside 4a
  |
  o 1 53f543eb8e45 inside 2a
  |
  o 0 1be3e5221c6a... outside 2a

  $ hg log -T '{if(ellipsis,"...")}{node|short} {p1node|short} {p2node|short} {desc}\n' | sort
  ...0ebbd712a0c8 0d4c867aeb23 000000000000 outside 4d
  ...1be3e5221c6a 000000000000 000000000000 outside 2a
  ...33d530345455 0ce6481bfe07 000000000000 outside 4c
  ...3df233defecc 7162cc6d11a4 000000000000 outside 4b
  ...b8a3da16ba49 53f543eb8e45 000000000000 outside 4a
  ...caa65c940632 000000000000 000000000000 outside 2c
  ...e932969c3961 000000000000 000000000000 outside 2d
  ...f2a632f0082d 000000000000 000000000000 outside 2b
  0ce6481bfe07 caa65c940632 000000000000 inside 2c
  0d4c867aeb23 e932969c3961 000000000000 inside 2d
  53f543eb8e45 1be3e5221c6a 000000000000 inside 2a
  7162cc6d11a4 f2a632f0082d 000000000000 inside 2b

  $ cd ../pullmaster
  $ hg update -r 'desc("outside 4a")'
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg merge -r 'desc("outside 4b")' 2>&1 | egrep -v '(warning:|incomplete!)'
  merging inside/f
  merging outside/f
  0 files updated, 0 files merged, 0 files removed, 2 files unresolved
  use 'hg resolve' to retry unresolved file merges or 'hg merge --abort' to abandon
  $ echo 3 > inside/f
  $ echo 5 > outside/f
  $ rm -f {in,out}side/f.orig
  $ hg resolve --mark inside/f outside/f
  (no more unresolved files)
  $ hg commit -m 'merge a/b 5'

  $ hg update -r 'desc("outside 4c")'
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg merge -r 'desc("outside 4d")' 2>&1 | egrep -v '(warning:|incomplete!)'
  merging inside/f
  merging outside/f
  0 files updated, 0 files merged, 0 files removed, 2 files unresolved
  use 'hg resolve' to retry unresolved file merges or 'hg merge --abort' to abandon
  $ echo 3 > inside/f
  $ echo 5 > outside/f
  $ rm -f {in,out}side/f.orig
  $ hg resolve --mark inside/f outside/f
  (no more unresolved files)
  $ hg commit -m 'merge c/d 5'

  $ hg update -r 'desc("merge a/b 5")'
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg merge -r 'desc("merge c/d 5")'
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  (branch merge, don't forget to commit)
  $ echo 6 > outside/f
  $ hg commit -m 'outside 6'
  $ echo 7 > outside/f
  $ hg commit -m 'outside 7'
  $ echo 8 > outside/f
  $ hg commit -m 'outside 8'

  $ cd ../pullshallow
  $ hg pull --depth 3
  pulling from ssh://user@dummy/pullmaster
  searching for changes
  adding changesets
  adding manifests
  adding file changes
  added 4 changesets with 3 changes to 1 files (-3 heads)
  new changesets *:* (glob)
  (run 'hg update' to get a working copy)

  $ hg log -T '{if(ellipsis,"...")}{node|short} {p1node|short} {p2node|short} {desc}\n' | sort
  ...0ebbd712a0c8 0d4c867aeb23 000000000000 outside 4d
  ...1be3e5221c6a 000000000000 000000000000 outside 2a
  ...33d530345455 0ce6481bfe07 000000000000 outside 4c
  ...3df233defecc 7162cc6d11a4 000000000000 outside 4b
  ...b8a3da16ba49 53f543eb8e45 000000000000 outside 4a
  ...bf545653453e 968003d40c60 000000000000 outside 8
  ...caa65c940632 000000000000 000000000000 outside 2c
  ...e932969c3961 000000000000 000000000000 outside 2d
  ...f2a632f0082d 000000000000 000000000000 outside 2b
  0ce6481bfe07 caa65c940632 000000000000 inside 2c
  0d4c867aeb23 e932969c3961 000000000000 inside 2d
  53f543eb8e45 1be3e5221c6a 000000000000 inside 2a
  67d49c0bdbda b8a3da16ba49 3df233defecc merge a/b 5
  7162cc6d11a4 f2a632f0082d 000000000000 inside 2b
  968003d40c60 67d49c0bdbda e867021d52c2 outside 6
  e867021d52c2 33d530345455 0ebbd712a0c8 merge c/d 5