upstream/mercurial-mirror Commit - r52147:f94c1033

1

# revlog.py - storage back-end for mercurial

1

# revlog.py - storage back-end for mercurial

2

# coding: utf8

2

# coding: utf8

3

#

3

#

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

"""Storage back-end for Mercurial.

9

"""Storage back-end for Mercurial.

10

11

This provides efficient delta storage with O(1) retrieve and append

11

This provides efficient delta storage with O(1) retrieve and append

12

and O(changes) merge between branches.

12

and O(changes) merge between branches.

13

"""

13

"""

14

15

16

import binascii

16

import binascii

17

import collections

17

import collections

18

import contextlib

18

import contextlib

19

import functools

19

import functools

20

import io

20

import io

21

import os

21

import os

22

import struct

22

import struct

23

import weakref

23

import weakref

24

import zlib

24

import zlib

25

26

# import stuff from node for others to import from revlog

26

# import stuff from node for others to import from revlog

27

from .node import (

27

from .node import (

28

bin,

28

bin,

29

hex,

29

hex,

30

nullrev,

30

nullrev,

31

sha1nodeconstants,

31

sha1nodeconstants,

32

short,

32

short,

33

wdirrev,

33

wdirrev,

34

)

34

)

35

from .i18n import _

35

from .i18n import _

36

from .revlogutils.constants import (

36

from .revlogutils.constants import (

37

ALL_KINDS,

37

ALL_KINDS,

38

CHANGELOGV2,

38

CHANGELOGV2,

39

COMP_MODE_DEFAULT,

39

COMP_MODE_DEFAULT,

40

COMP_MODE_INLINE,

40

COMP_MODE_INLINE,

41

COMP_MODE_PLAIN,

41

COMP_MODE_PLAIN,

42

DELTA_BASE_REUSE_NO,

42

DELTA_BASE_REUSE_NO,

43

DELTA_BASE_REUSE_TRY,

43

DELTA_BASE_REUSE_TRY,

44

ENTRY_RANK,

44

ENTRY_RANK,

45

FEATURES_BY_VERSION,

45

FEATURES_BY_VERSION,

46

FLAG_GENERALDELTA,

46

FLAG_GENERALDELTA,

47

FLAG_INLINE_DATA,

47

FLAG_INLINE_DATA,

48

INDEX_HEADER,

48

INDEX_HEADER,

49

KIND_CHANGELOG,

49

KIND_CHANGELOG,

50

KIND_FILELOG,

50

KIND_FILELOG,

51

RANK_UNKNOWN,

51

RANK_UNKNOWN,

52

REVLOGV0,

52

REVLOGV0,

53

REVLOGV1,

53

REVLOGV1,

54

REVLOGV1_FLAGS,

54

REVLOGV1_FLAGS,

55

REVLOGV2,

55

REVLOGV2,

56

REVLOGV2_FLAGS,

56

REVLOGV2_FLAGS,

57

REVLOG_DEFAULT_FLAGS,

57

REVLOG_DEFAULT_FLAGS,

58

REVLOG_DEFAULT_FORMAT,

58

REVLOG_DEFAULT_FORMAT,

59

REVLOG_DEFAULT_VERSION,

59

REVLOG_DEFAULT_VERSION,

60

SUPPORTED_FLAGS,

60

SUPPORTED_FLAGS,

61

)

61

)

62

from .revlogutils.flagutil import (

62

from .revlogutils.flagutil import (

63

REVIDX_DEFAULT_FLAGS,

63

REVIDX_DEFAULT_FLAGS,

64

REVIDX_ELLIPSIS,

64

REVIDX_ELLIPSIS,

65

REVIDX_EXTSTORED,

65

REVIDX_EXTSTORED,

66

REVIDX_FLAGS_ORDER,

66

REVIDX_FLAGS_ORDER,

67

REVIDX_HASCOPIESINFO,

67

REVIDX_HASCOPIESINFO,

68

REVIDX_ISCENSORED,

68

REVIDX_ISCENSORED,

69

REVIDX_RAWTEXT_CHANGING_FLAGS,

69

REVIDX_RAWTEXT_CHANGING_FLAGS,

70

)

70

)

71

from .thirdparty import attr

71

from .thirdparty import attr

72

from . import (

72

from . import (

73

ancestor,

73

ancestor,

74

dagop,

74

dagop,

75

error,

75

error,

76

mdiff,

76

mdiff,

77

policy,

77

policy,

78

pycompat,

78

pycompat,

79

revlogutils,

79

revlogutils,

80

templatefilters,

80

templatefilters,

81

util,

81

util,

82

)

82

)

83

from .interfaces import (

83

from .interfaces import (

84

repository,

84

repository,

85

util as interfaceutil,

85

util as interfaceutil,

86

)

86

)

87

from .revlogutils import (

87

from .revlogutils import (

88

deltas as deltautil,

88

deltas as deltautil,

89

docket as docketutil,

89

docket as docketutil,

90

flagutil,

90

flagutil,

91

nodemap as nodemaputil,

91

nodemap as nodemaputil,

92

randomaccessfile,

92

randomaccessfile,

93

revlogv0,

93

revlogv0,

94

rewrite,

94

rewrite,

95

sidedata as sidedatautil,

95

sidedata as sidedatautil,

96

)

96

)

97

from .utils import (

97

from .utils import (

98

storageutil,

98

storageutil,

99

stringutil,

99

stringutil,

100

)

100

)

101

102

# blanked usage of all the name to prevent pyflakes constraints

102

# blanked usage of all the name to prevent pyflakes constraints

103

# We need these name available in the module for extensions.

103

# We need these name available in the module for extensions.

104

105

REVLOGV0

105

REVLOGV0

106

REVLOGV1

106

REVLOGV1

107

REVLOGV2

107

REVLOGV2

108

CHANGELOGV2

108

CHANGELOGV2

109

FLAG_INLINE_DATA

109

FLAG_INLINE_DATA

110

FLAG_GENERALDELTA

110

FLAG_GENERALDELTA

111

REVLOG_DEFAULT_FLAGS

111

REVLOG_DEFAULT_FLAGS

112

REVLOG_DEFAULT_FORMAT

112

REVLOG_DEFAULT_FORMAT

113

REVLOG_DEFAULT_VERSION

113

REVLOG_DEFAULT_VERSION

114

REVLOGV1_FLAGS

114

REVLOGV1_FLAGS

115

REVLOGV2_FLAGS

115

REVLOGV2_FLAGS

116

REVIDX_ISCENSORED

116

REVIDX_ISCENSORED

117

REVIDX_ELLIPSIS

117

REVIDX_ELLIPSIS

118

REVIDX_HASCOPIESINFO

118

REVIDX_HASCOPIESINFO

119

REVIDX_EXTSTORED

119

REVIDX_EXTSTORED

120

REVIDX_DEFAULT_FLAGS

120

REVIDX_DEFAULT_FLAGS

121

REVIDX_FLAGS_ORDER

121

REVIDX_FLAGS_ORDER

122

REVIDX_RAWTEXT_CHANGING_FLAGS

122

REVIDX_RAWTEXT_CHANGING_FLAGS

123

124

parsers = policy.importmod('parsers')

124

parsers = policy.importmod('parsers')

125

rustancestor = policy.importrust('ancestor')

125

rustancestor = policy.importrust('ancestor')

126

rustdagop = policy.importrust('dagop')

126

rustdagop = policy.importrust('dagop')

127

rustrevlog = policy.importrust('revlog')

127

rustrevlog = policy.importrust('revlog')

128

129

# Aliased for performance.

129

# Aliased for performance.

130

_zlibdecompress = zlib.decompress

130

_zlibdecompress = zlib.decompress

131

132

# max size of inline data embedded into a revlog

132

# max size of inline data embedded into a revlog

133

_maxinline = 131072

133

_maxinline = 131072

134

135

# Flag processors for REVIDX_ELLIPSIS.

135

# Flag processors for REVIDX_ELLIPSIS.

136

def ellipsisreadprocessor(rl, text):
    """Read-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is not used. ``text`` is handed back untouched, paired with
    ``False``.
    """
    # NOTE(review): the second item is presumably the "validate hash" flag
    # expected by the flag-processing machinery -- confirm against flagutil.
    unchanged = text
    return (unchanged, False)

138

139

140

def ellipsiswriteprocessor(rl, text):
    """Write-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is not used. ``text`` is handed back untouched, paired with
    ``False``.
    """
    # NOTE(review): the second item is presumably the "validate hash" flag
    # expected by the flag-processing machinery -- confirm against flagutil.
    unchanged = text
    return (unchanged, False)

142

143

144

def ellipsisrawprocessor(rl, text):
    """Raw flag processor for REVIDX_ELLIPSIS.

    Neither argument is inspected; the answer is always ``False``.
    """
    answer = False
    return answer

146

147

148

# The three REVIDX_ELLIPSIS processors bundled together, in
# (read, write, raw) order.
ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)

153

154

155

def _verify_revision(rl, skipflags, state, node):
    """Check the integrity of ``node`` in the revlog ``rl``.

    This is kept as a separate function so that extensions have a hook
    point to influence the operation.

    When ``skipflags`` is truthy the revision is not read; ``node`` is
    recorded in ``state[b'skipread']`` instead. Otherwise the revision is
    read through ``rl.revision``.
    """
    if not skipflags:
        # Side-effect: read content and verify hash.
        rl.revision(node)
        return
    state[b'skipread'].add(node)

163

164

165

# True if a fast implementation for persistent-nodemap is available.
#
# We also consider that we have a "fast" implementation in "pure" Python,
# because people using pure don't really have performance considerations
# (and have a wheelbarrow of other sources of slowness).
#
# Concretely: either the Rust revlog module was imported, or the selected
# ``parsers`` module exposes ``BaseIndexObject``.
HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
    parsers, 'BaseIndexObject'
)

173

174

175

@interfaceutil.implementer(repository.irevisiondelta)
@attr.s(slots=True)
class revlogrevisiondelta:
    """Slotted attrs record declared to implement
    ``repository.irevisiondelta``.

    Every field except ``linknode`` is required by the generated
    constructor, in declaration order.
    """

    node = attr.ib()
    p1node = attr.ib()
    p2node = attr.ib()
    basenode = attr.ib()
    flags = attr.ib()
    baserevisionsize = attr.ib()
    revision = attr.ib()
    delta = attr.ib()
    sidedata = attr.ib()
    protocol_flags = attr.ib()
    # the only optional field; left as None when not supplied
    linknode = attr.ib(default=None)

189

190

191

@interfaceutil.implementer(repository.iverifyproblem)
@attr.s(frozen=True)
class revlogproblem:
    """Frozen attrs record declared to implement
    ``repository.iverifyproblem``.

    All three fields are optional and default to None.
    """

    warning = attr.ib(default=None)
    error = attr.ib(default=None)
    node = attr.ib(default=None)

197

198

199

def parse_index_v1(data, inline):
    """Parse ``data`` with ``parsers.parse_index2`` using its default format.

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # delegate the actual parsing to the C implementation
    parsed_index, chunk_cache = parsers.parse_index2(data, inline)
    return parsed_index, chunk_cache

203

204

205

def parse_index_v2(data, inline):
    """Parse ``data`` with ``parsers.parse_index2`` in the REVLOGV2 format.

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # delegate the actual parsing to the C implementation
    parsed_index, chunk_cache = parsers.parse_index2(
        data, inline, format=REVLOGV2
    )
    return parsed_index, chunk_cache

209

210

211

def parse_index_cl_v2(data, inline):
    """Parse ``data`` with ``parsers.parse_index2`` in the CHANGELOGV2 format.

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # delegate the actual parsing to the C implementation
    parsed_index, chunk_cache = parsers.parse_index2(
        data, inline, format=CHANGELOGV2
    )
    return parsed_index, chunk_cache

215

216

217

# Only defined when the selected ``parsers`` module offers the devel nodemap
# parser; stays None otherwise.
parse_index_v1_nodemap = None

if hasattr(parsers, 'parse_index_devel_nodemap'):

    def parse_index_v1_nodemap(data, inline):
        """Parse ``data`` with ``parsers.parse_index_devel_nodemap``.

        Returns the ``(index, cache)`` pair produced by the parser.
        """
        parsed_index, chunk_cache = parsers.parse_index_devel_nodemap(
            data, inline
        )
        return parsed_index, chunk_cache

226

227

228

def parse_index_v1_rust(data, inline, default_header):
    """Build a Rust-backed index from ``data``.

    Returns an ``(index, cache)`` pair. ``index`` is
    ``rustrevlog.Index(data, default_header)``. ``cache`` is ``(0, data)``
    when ``inline`` is truthy and ``None`` otherwise.
    """
    # NOTE(review): (0, data) presumably seeds the chunk cache as
    # (offset, bytes) for inline revlogs -- confirm against the consumer.
    cache = (0, data) if inline else None
    return rustrevlog.Index(data, default_header), cache

231

232

233

# Corresponds to the uncompressed length field of indexformatng: a 4-byte
# signed integer, hence a maximum of 2 gigabytes.
_maxentrysize = 0x7FFFFFFF

# Translated message template; its placeholders are, in order, one %s
# followed by three %d values.
FILE_TOO_SHORT_MSG = _(
    b'cannot read from revlog %s;'
    b' expected %d bytes from offset %d, data size is %d'
)

# every byte accepted as a hexadecimal digit, in both letter cases
hexdigits = b'0123456789abcdefABCDEF'

243

244

245

class _Config:
    """Common base of the revlog configuration holders."""

    def copy(self):
        """Return a new object of the same class as ``self``.

        The constructor receives every instance attribute of ``self`` as a
        keyword argument, so attribute values are shared, not duplicated.
        """
        cls = type(self)
        attributes = vars(self)
        return cls(**attributes)

248

249

250

@attr.s()
class FeatureConfig(_Config):
    """Hold configuration values about the available revlog features"""

    # the default compression engine
    compression_engine = attr.ib(default=b'zlib')
    # options for the compression engines (a fresh dict per instance)
    compression_engine_options = attr.ib(default=attr.Factory(dict))

    # can we use censor on this revlog
    censorable = attr.ib(default=False)
    # does this revlog use the "side data" feature
    has_side_data = attr.ib(default=False)
    # might remove rank configuration once the computation has no impact
    compute_rank = attr.ib(default=False)
    # Parent order is supposed to be semantically irrelevant, so we
    # normally re-sort parents to ensure that the first parent is non-null,
    # if there is a non-null parent at all.
    # filelog abuses the parent order as a flag to mark some instances of
    # meta-encoded files, so allow it to disable this behavior.
    canonical_parent_order = attr.ib(default=False)
    # can ellipsis commits be used
    enable_ellipsis = attr.ib(default=False)

    def copy(self):
        """Copy the configuration, giving the copy its own options dict."""
        new = super().copy()
        # The base copy() passes the very same dict object to the new
        # instance; duplicate it so the two configs do not share it.
        new.compression_engine_options = self.compression_engine_options.copy()
        return new

278

279

280

@attr.s()
class DataConfig(_Config):
    """Hold configuration value about how the revlog data are read"""

    # should we try to open the "pending" version of the revlog
    try_pending = attr.ib(default=False)
    # should we try to open the "split" version of the revlog
    try_split = attr.ib(default=False)
    # When True, indexfile should be opened with checkambig=True at writing,
    # to avoid file stat ambiguity.
    check_ambig = attr.ib(default=False)

    # If true, use mmap instead of reading to deal with large index
    mmap_large_index = attr.ib(default=False)
    # how much data counts as "large"
    mmap_index_threshold = attr.ib(default=None)
    # How much data to read and cache into the raw revlog data cache.
    chunk_cache_size = attr.ib(default=65536)

    # The size of the uncompressed cache compared to the largest revision seen.
    uncompressed_cache_factor = attr.ib(default=None)

    # The number of chunks cached
    uncompressed_cache_count = attr.ib(default=None)

    # Allow sparse reading of the revlog data
    with_sparse_read = attr.ib(default=False)
    # minimal density of a sparse read chunk
    sr_density_threshold = attr.ib(default=0.50)
    # minimal size of data we skip when performing sparse read
    sr_min_gap_size = attr.ib(default=262144)

    # are deltas encoded against arbitrary bases.
    generaldelta = attr.ib(default=False)

314

315

316

@attr.s()
class DeltaConfig(_Config):
    """Hold configuration value about how new delta are computed

    Some attributes are duplicated from DataConfig to help having each object
    self contained.
    """

    # can deltas be encoded against arbitrary bases.
    general_delta = attr.ib(default=False)
    # Allow sparse writing of the revlog data
    sparse_revlog = attr.ib(default=False)
    # maximum length of a delta chain
    max_chain_len = attr.ib(default=None)
    # Maximum distance between delta chain base start and end
    max_deltachain_span = attr.ib(default=-1)
    # If `upper_bound_comp` is not None, this is the expected maximal gain from
    # compression for the data content.
    upper_bound_comp = attr.ib(default=None)
    # Should we try a delta against both parents
    delta_both_parents = attr.ib(default=True)
    # Test delta base candidate groups in chunks of this maximal size.
    candidate_group_chunk_size = attr.ib(default=0)
    # Should we display debug information about delta computation
    debug_delta = attr.ib(default=False)
    # trust incoming deltas by default
    lazy_delta = attr.ib(default=True)
    # Whether to trust the base of incoming deltas (off by default)
    lazy_delta_base = attr.ib(default=False)

345

346

347

class _InnerRevlog:

347

class _InnerRevlog:

348

"""An inner layer of the revlog object

348

"""An inner layer of the revlog object

349

350

That layer exist to be able to delegate some operation to Rust, its

350

That layer exist to be able to delegate some operation to Rust, its

351

boundaries are arbitrary and based on what we can delegate to Rust.

351

boundaries are arbitrary and based on what we can delegate to Rust.

352

"""

352

"""

353

354

def __init__(
    self,
    opener,
    index,
    index_file,
    data_file,
    sidedata_file,
    inline,
    data_config,
    delta_config,
    feature_config,
    chunk_cache,
    default_compression_header,
):
    """Store the collaborators and set up the caches and segment files.

    Every argument except ``chunk_cache`` is kept on the instance.
    ``chunk_cache`` is only forwarded to the main segment file.
    """
    self.opener = opener
    self.index = index

    # file names and layout
    self.index_file = index_file
    self.data_file = data_file
    self.sidedata_file = sidedata_file
    self.inline = inline

    # configuration objects
    self.data_config = data_config
    self.delta_config = delta_config
    self.feature_config = feature_config

    # used during diverted write.
    self._orig_index_file = None

    self._default_compression_header = default_compression_header

    # 3-tuple of file handles being used for active writing.
    self._writinghandles = None

    # Revision data lives in the index file for inline revlogs and in the
    # data file otherwise.
    segment_name = index_file if inline else data_file
    cache_size = data_config.chunk_cache_size
    self._segmentfile = randomaccessfile.randomaccessfile(
        opener,
        segment_name,
        cache_size,
        chunk_cache,
    )
    self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
        opener,
        sidedata_file,
        data_config.chunk_cache_size,
    )

    # revlog header -> revlog compressor
    self._decompressors = {}
    # 3-tuple of (node, rev, text) for a raw revision.
    self._revisioncache = None

    # Cache of some uncompressed chunks (rev -> uncompressed chunk), only
    # enabled when a cache factor is configured.
    #
    # The max cost is dynamically updated to be proportional to the size
    # of the revisions we actually encounter.
    uncompressed_cache = None
    if data_config.uncompressed_cache_factor is not None:
        uncompressed_cache = util.lrucachedict(
            data_config.uncompressed_cache_count,
            maxcost=65536,  # some arbitrary initial value
        )
    self._uncompressed_chunk_cache = uncompressed_cache

    self._delay_buffer = None

419

420

def __len__(self):
    """Return the number of entries held by the index."""
    entries = self.index
    return len(entries)

422

423

def clear_cache(self):
    """Drop every cache held by this object.

    Must not be called while the revlog is delaying the visibility of
    written data (checked with an assertion).
    """
    assert not self.is_delaying
    self._revisioncache = None
    chunk_cache = self._uncompressed_chunk_cache
    if chunk_cache is not None:
        chunk_cache.clear()
    for segment in (self._segmentfile, self._segmentfile_sidedata):
        segment.clear_cache()

430

431

@property
def canonical_index_file(self):
    """The original index file name when one is recorded (it is set
    during a diverted write), otherwise the current index file name."""
    original = self._orig_index_file
    return self.index_file if original is None else original

436

437

@property
def is_delaying(self):
    """Is the revlog currently delaying the visibility of written data?

    The delaying mechanism can be either in-memory (a delay buffer is
    set) or written on disk in a side-file (an original index file name
    is recorded).
    """
    nothing_pending = (
        self._delay_buffer is None and self._orig_index_file is None
    )
    return not nothing_pending

446

447

# Derived from index values.

447

# Derived from index values.

448

449

def start(self, rev):
    """Return the offset of the data chunk for revision ``rev``.

    The offset is the first field of the index entry shifted right by
    16 bits.
    """
    # NOTE(review): the low 16 bits presumably carry the revision flags --
    # confirm against the index format.
    packed = self.index[rev][0]
    return int(packed >> 16)

452

453

def length(self, rev):
    """Return the length of the data chunk for revision ``rev`` (the
    second field of its index entry)."""
    entry = self.index[rev]
    return entry[1]

456

457

def end(self, rev):
    """Return the offset just past the data chunk for revision ``rev``
    (its start offset plus its length)."""
    begin = self.start(rev)
    return begin + self.length(rev)

460

461

def deltaparent(self, rev):
    """Return the revision that ``rev`` is stored as a delta against.

    ``nullrev`` is returned when the entry is its own base. With general
    delta the recorded base is returned; otherwise it is the previous
    revision.
    """
    base = self.index[rev][3]
    if base == rev:
        return nullrev
    if not self.delta_config.general_delta:
        return rev - 1
    return base

470

471

def issnapshot(self, rev):

471

def issnapshot(self, rev):

472

"""tells whether rev is a snapshot"""

472

"""tells whether rev is a snapshot"""

473

if not self.delta_config.sparse_revlog:

473

if not self.delta_config.sparse_revlog:

474

return self.deltaparent(rev) == nullrev

474

return self.deltaparent(rev) == nullrev

475

elif hasattr(self.index, 'issnapshot'):

475

elif hasattr(self.index, 'issnapshot'):

476

# directly assign the method to cache the testing and access

476

# directly assign the method to cache the testing and access

477

self.issnapshot = self.index.issnapshot

477

self.issnapshot = self.index.issnapshot

478

return self.issnapshot(rev)

478

return self.issnapshot(rev)

479

if rev == nullrev:

479

if rev == nullrev:

480

return True

480

return True

481

entry = self.index[rev]

481

entry = self.index[rev]

482

base = entry[3]

482

base = entry[3]

483

if base == rev:

483

if base == rev:

484

return True

484

return True

485

if base == nullrev:

485

if base == nullrev:

486

return True

486

return True

487

p1 = entry[5]

487

p1 = entry[5]

488

while self.length(p1) == 0:

488

while self.length(p1) == 0:

489

b = self.deltaparent(p1)

489

b = self.deltaparent(p1)

490

if b == p1:

490

if b == p1:

491

break

491

break

492

p1 = b

492

p1 = b

493

p2 = entry[6]

493

p2 = entry[6]

494

while self.length(p2) == 0:

494

while self.length(p2) == 0:

495

b = self.deltaparent(p2)

495

b = self.deltaparent(p2)

496

if b == p2:

496

if b == p2:

497

break

497

break

498

p2 = b

498

p2 = b

499

if base == p1 or base == p2:

499

if base == p1 or base == p2:

500

return False

500

return False

501

return self.issnapshot(base)

501

return self.issnapshot(base)

502

503

def _deltachain(self, rev, stoprev=None):
    """Obtain the delta chain for a revision.

    ``stoprev`` specifies a revision to stop at. If not specified, we
    stop at the base of the chain.

    Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
    revs in ascending order and ``stopped`` is a bool indicating whether
    ``stoprev`` was hit.
    """
    generaldelta = self.delta_config.general_delta
    # Prefer the implementation offered by the index object, when it has
    # one.
    try:
        return self.index.deltachain(rev, stoprev, generaldelta)
    except AttributeError:
        pass

    # Alias to prevent attribute lookup in tight loop.
    index = self.index

    chain = []
    current = rev
    entry = index[current]
    # Walk towards the base until we reach an entry that is its own base,
    # or the requested stop revision.
    while not (current == entry[3] or current == stoprev):
        chain.append(current)
        current = entry[3] if generaldelta else current - 1
        entry = index[current]

    stopped = current == stoprev
    if not stopped:
        # the chain base itself is part of the chain
        chain.append(current)

    chain.reverse()
    return chain, stopped

543

544

@util.propertycache
def _compressor(self):
    """Revlog compressor of the configured compression engine, built with
    the configured engine options."""
    features = self.feature_config
    engine = util.compengines[features.compression_engine]
    return engine.revlogcompressor(features.compression_engine_options)

550

551

@util.propertycache
def _decompressor(self):
    """Decompression callable matching the default compression header.

    Evaluates to ``None`` when ``self._default_compression_header`` is
    ``None``; otherwise to the ``decompress`` attribute of the object
    returned by ``self._get_decompressor`` for that header.
    """
    if self._default_compression_header is None:
        return None
    default_header = self._default_compression_header
    return self._get_decompressor(default_header).decompress

559

560

def _get_decompressor(self, t):
    """Return the decompressor object associated with revlog header ``t``.

    Objects are memoized in ``self._decompressors``. On a miss, the engine
    is resolved with ``util.compengines.forrevlogheader(t)``, its revlog
    compressor is built with the configured engine options and stored in
    the memo before being returned.

    Raises ``error.RevlogError`` when resolving or building the engine
    fails with a ``KeyError``.
    """
    # Fast path: this header was already resolved.
    try:
        return self._decompressors[t]
    except KeyError:
        pass

    try:
        engine = util.compengines.forrevlogheader(t)
        resolved = engine.revlogcompressor(
            self.feature_config.compression_engine_options
        )
        self._decompressors[t] = resolved
    except KeyError:
        raise error.RevlogError(
            _(b'unknown compression type %s') % binascii.hexlify(t)
        )
    return resolved

575

576

def compress(self, data):
    """Generate a possibly-compressed representation of data.

    Returns a ``(header, payload)`` pair:

    - empty ``data`` is returned as ``(b'', data)``;
    - when ``self._compressor.compress`` yields a truthy result, that result
      is returned with an empty header (it already carries its own header);
    - otherwise ``data`` is stored raw: with an empty header when it begins
      with a NUL byte, and with a ``b'u'`` header in every other case.
    """
    if data:
        packed = self._compressor.compress(data)
        if packed:
            # The revlog compressor added the header in the returned data.
            return b'', packed
        if data[0:1] != b'\0':
            # Raw data needs an explicit marker unless it starts with NUL.
            return b'u', data
    return b'', data

590

591

def decompress(self, data):
    """Decompress a revlog chunk.

    The first byte of the chunk is a header identifying its format, which
    selects the decoding path:

    - ``x``: handed to ``_zlibdecompress``; a ``zlib.error`` is re-raised
      as ``error.RevlogError``
    - NUL byte: raw data, returned unchanged
    - ``u``: raw data behind a one byte marker, returned as a buffer that
      starts after the marker
    - any other header: delegated to the object returned by
      ``self._get_decompressor`` for that header

    Empty input is returned unchanged.
    """
    if not data:
        return data

    # This is a hot path: revlogs are read far more often than written and
    # many chunks decompress in microseconds.  The checks are ordered on
    # these assumptions:
    #
    # 1) most chunks are compressed (as opposed to inline raw data);
    # 2) decompressing anything is likely at least 10x slower than
    #    returning raw inline data;
    # 3) common, officially supported engines deserve priority.
    #
    # Hence the inline header tests come first and the generic compengines
    # lookup last.  According to `hg perfrevlogchunks`, this is ~0.5%
    # faster for zlib compressed chunks, which matters for changelog and
    # manifest reads.
    header = data[0:1]

    if header == b'x':
        try:
            return _zlibdecompress(data)
        except zlib.error as e:
            raise error.RevlogError(
                _(b'revlog decompress error: %s')
                % stringutil.forcebytestr(e)
            )
    # '\0' is more common than 'u' so it goes first.
    if header == b'\0':
        return data
    if header == b'u':
        return util.buffer(data, 1)

    return self._get_decompressor(header).decompress(data)

640

641

@contextlib.contextmanager
def reading(self):
    """Context manager that keeps data and sidedata files open for reading

    With an empty index there is nothing to read and no file is opened.
    Otherwise the ``reading()`` contexts of ``self._segmentfile`` and
    ``self._segmentfile_sidedata`` are both held for the duration of the
    block.

    Raises ``error.ProgrammingError`` when a delay buffer is set on an
    inline revlog.
    """
    if len(self.index) == 0:
        yield  # nothing to be read
        return

    if self._delay_buffer is not None and self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)

    data_segment = self._segmentfile
    with data_segment.reading(), self._segmentfile_sidedata.reading():
        yield

653

654

@property
def is_writing(self):
    """True if a writing context is open"""
    handles = self._writinghandles
    return handles is not None

658

659

@property
def is_open(self):
    """True if any file handle is being held

    Reports the ``is_open`` state of the data segment file and, when that
    one is falsy, of the sidedata segment file.

    Used for assert and debug in the python code"""
    data_open = self._segmentfile.is_open
    if data_open:
        return data_open
    return self._segmentfile_sidedata.is_open

665

666

@contextlib.contextmanager
def writing(self, transaction, data_end=None, sidedata_end=None):
    """Open the revlog files for writing

    Adding content to a revlog should be done within such a context.

    ``transaction`` has its ``add(file, offset)`` method called for every
    file opened here (data, sidedata and index).

    ``data_end`` is the offset the data file handle is positioned at; when
    it is None the handle is positioned at the end of the file.

    ``sidedata_end`` is the offset the sidedata file handle is positioned
    at; it must not be None when the revlog has a sidedata file.

    If a writing context is already open, this is a no-op that simply
    yields.  Otherwise the handles are exposed through
    ``self._writinghandles`` and the segment files for the duration of the
    block, then cleared and closed on exit, even on error.
    """
    if self.is_writing:
        yield
        return

    ifh = dfh = sdfh = None
    try:
        r = len(self.index)
        # opening the data file.
        dsize = 0
        if r:
            dsize = self.end(r - 1)
        if not self.inline:
            try:
                dfh = self.opener(self.data_file, mode=b"r+")
                if data_end is None:
                    dfh.seek(0, os.SEEK_END)
                else:
                    dfh.seek(data_end, os.SEEK_SET)
            except FileNotFoundError:
                dfh = self.opener(self.data_file, mode=b"w+")
            transaction.add(self.data_file, dsize)
        if self.sidedata_file is not None:
            assert sidedata_end is not None
            # revlog-v2 does not inline, help Pytype
            assert dfh is not None
            try:
                sdfh = self.opener(self.sidedata_file, mode=b"r+")
                # Position the sidedata handle itself.  Seeking the data
                # handle here would move it away from `data_end` and leave
                # the sidedata handle at the start of its file.
                sdfh.seek(sidedata_end, os.SEEK_SET)
            except FileNotFoundError:
                sdfh = self.opener(self.sidedata_file, mode=b"w+")
            transaction.add(self.sidedata_file, sidedata_end)

        # opening the index file.
        isize = r * self.index.entry_size
        ifh = self.__index_write_fp()
        if self.inline:
            # an inline revlog stores the data inside the index file
            transaction.add(self.index_file, dsize + isize)
        else:
            transaction.add(self.index_file, isize)
        # exposing all file handle for writing.
        self._writinghandles = (ifh, dfh, sdfh)
        self._segmentfile.writing_handle = ifh if self.inline else dfh
        self._segmentfile_sidedata.writing_handle = sdfh
        yield
    finally:
        self._writinghandles = None
        self._segmentfile.writing_handle = None
        self._segmentfile_sidedata.writing_handle = None
        if dfh is not None:
            dfh.close()
        if sdfh is not None:
            sdfh.close()
        # closing the index file last to avoid exposing referent to
        # potential unflushed data content.
        if ifh is not None:
            ifh.close()

728

729

def __index_write_fp(self, index_end=None):
    """internal method to open the index file for writing

    The index is opened in ``r+`` mode and positioned at ``index_end``, or
    at the end of the file when ``index_end`` is None.  If that raises
    ``FileNotFoundError`` the index is opened in ``w+`` mode instead and
    returned without seeking.

    You should not use this directly and use `_writing` instead
    """

    def open_index(mode):
        """Open the index in ``mode``, through the delay buffer if any."""
        if self._delay_buffer is None:
            return self.opener(
                self.index_file,
                mode=mode,
                checkambig=self.data_config.check_ambig,
            )
        # check_ambig affects the way a file is opened for writing.
        # However no file is actually opened for writing here, as writes
        # are appended to the delay buffer, so check_ambig is neither
        # meaningful nor needed.
        return randomaccessfile.appender(
            self.opener, self.index_file, mode, self._delay_buffer
        )

    try:
        handle = open_index(b"r+")
        if index_end is None:
            handle.seek(0, os.SEEK_END)
        else:
            handle.seek(index_end, os.SEEK_SET)
        return handle
    except FileNotFoundError:
        return open_index(b"w+")

765

766

def __index_new_fp(self):
    """internal method to create a new index file for writing

    The index file is opened through ``self.opener`` in ``w`` mode with
    ``atomictemp=True`` and the configured ``check_ambig`` setting.

    You should not use this unless you are upgrading from inline revlog
    """
    open_file = self.opener
    index_path = self.index_file
    check_ambig = self.data_config.check_ambig
    return open_file(
        index_path, mode=b"w", checkambig=check_ambig, atomictemp=True
    )

777

778

def split_inline(self, tr, header, new_index_file_path=None):
    """split the data of an inline revlog into an index and a data file

    The segment of every revision is copied into a freshly truncated data
    file, then the index entries are rewritten to a new index file whose
    first entry is prefixed with the packed ``header``.

    When ``new_index_file_path`` is not None it becomes ``self.index_file``
    before the new index is written.  ``tr`` is not used by this method.

    If writing handles were open on entry, the index handle is closed
    first and a new set of handles is installed once the split is done.

    Returns the index file path in use after the split.
    """
    assert self._delay_buffer is None
    had_handles = self._writinghandles is not None
    if had_handles:
        inline_fp = self._writinghandles[0]
        inline_fp.flush()
        inline_fp.close()
        # We can't use the cached file handle after close(). So prevent
        # its usage.
        self._writinghandles = None
        self._segmentfile.writing_handle = None
        # No need to deal with sidedata writing handle as it is only
        # relevant with revlog-v2 which is never inline, not reaching
        # this code

    new_dfh = self.opener(self.data_file, mode=b"w+")
    new_dfh.truncate(0)  # drop any potentially existing data
    try:
        with self.reading():
            for rev in range(len(self.index)):
                segment = self.get_segment_for_revs(rev, rev)[1]
                new_dfh.write(segment)
            new_dfh.flush()

        if new_index_file_path is not None:
            self.index_file = new_index_file_path
        with self.__index_new_fp() as index_fp:
            self.inline = False
            for rev in range(len(self.index)):
                entry = self.index.entry_binary(rev)
                if rev == 0:
                    # the first entry carries the revlog header
                    entry = self.index.pack_header(header) + entry
                index_fp.write(entry)

            # If we don't use side-write, the temp file replace the real
            # index when we exit the context manager

        self._segmentfile = randomaccessfile.randomaccessfile(
            self.opener,
            self.data_file,
            self.data_config.chunk_cache_size,
        )

        if had_handles:
            # switched from inline to conventional reopen the index
            ifh = self.__index_write_fp()
            self._writinghandles = (ifh, new_dfh, None)
            self._segmentfile.writing_handle = new_dfh
            # ownership moved to the writing handles: do not close below
            new_dfh = None
            # No need to deal with sidedata writing handle as it is only
            # relevant with revlog-v2 which is never inline, not reaching
            # this code
    finally:
        if new_dfh is not None:
            new_dfh.close()
    return self.index_file

836

837

def get_segment_for_revs(self, startrev, endrev):
    """Obtain a segment of raw data corresponding to a range of revisions.

    Accepts the start and end revisions of the range.  The data is read
    through ``self._segmentfile.read_chunk``.

    Returns a 2-tuple of (offset, data) for the requested range of
    revisions.  Offset is the integer offset the read started at (for an
    inline revlog it includes the interleaved index entries) and data is
    whatever ``read_chunk`` returned for that offset and length.

    Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
    to determine where each revision's data begins and ends.

    API: we should consider making this a private part of the InnerRevlog
    at some point.
    """
    # self.start(startrev) and self.end(endrev) are inlined here for perf
    # reasons (function calls are expensive).
    index = self.index
    first_entry = index[startrev]
    last_entry = first_entry if startrev == endrev else index[endrev]

    # Field 0 of an entry is shifted right by 16 bits to get the offset;
    # field 1 is added to it as the stored length.
    start = int(first_entry[0] >> 16)
    end = int(last_entry[0] >> 16) + last_entry[1]

    if self.inline:
        # skip the index entries stored ahead of each revision's data
        start += (startrev + 1) * self.index.entry_size
        end += (endrev + 1) * self.index.entry_size

    return start, self._segmentfile.read_chunk(start, end - start)

873

874

def _chunk(self, rev):
    """Obtain a single decompressed chunk for a revision.

    Accepts an integer revision.  When an uncompressed chunk cache is
    configured it is consulted first and updated with the result.

    The compression mode stored in the index entry selects how the raw
    segment is decoded: kept as is, passed to the default decompressor, or
    routed through ``self.decompress``.

    Returns the uncompressed data for the requested revision.  Raises
    ``error.RevlogError`` for an unknown compression mode.
    """
    cache = self._uncompressed_chunk_cache
    if cache is not None:
        cached = cache.get(rev)
        if cached is not None:
            return cached

    mode = self.index[rev][10]
    raw = self.get_segment_for_revs(rev, rev)[1]
    if mode == COMP_MODE_PLAIN:
        chunk = raw
    elif mode == COMP_MODE_DEFAULT:
        chunk = self._decompressor(raw)
    elif mode == COMP_MODE_INLINE:
        chunk = self.decompress(raw)
    else:
        msg = b'unknown compression mode %d'
        msg %= mode
        raise error.RevlogError(msg)

    if cache is not None:
        cache.insert(rev, chunk, cost=len(chunk))
    return chunk

903

904

def _chunks(self, revs, targetsize=None):
    """Obtain decompressed chunks for the specified revisions.

    Accepts a sequence of numeric revisions that are assumed to be in
    ascending order.  ``targetsize`` is forwarded to
    ``deltautil.slicechunk`` when sparse reads are enabled.

    Revisions present in the uncompressed chunk cache (when one is
    configured) are served from it; the others are read from disk in one
    segment per slice and decoded according to the compression mode stored
    in their index entry.

    This function is similar to calling ``self._chunk()`` multiple times,
    but is faster.

    Returns a list with decompressed data for each requested revision,
    ordered by revision number.  Raises ``error.RevlogError`` for an
    unknown compression mode.
    """
    if not revs:
        return []
    # Aliases to prevent attribute lookups in the loops below.
    start = self.start
    length = self.length
    inline = self.inline
    iosize = self.index.entry_size
    buffer = util.buffer

    fetched_revs = []
    fadd = fetched_revs.append

    chunks = []
    ladd = chunks.append

    if self._uncompressed_chunk_cache is None:
        fetched_revs = revs
    else:
        for rev in revs:
            cached_value = self._uncompressed_chunk_cache.get(rev)
            if cached_value is None:
                fadd(rev)
            else:
                ladd((rev, cached_value))

    if not fetched_revs:
        slicedchunks = ()
    elif not self.data_config.with_sparse_read:
        slicedchunks = (fetched_revs,)
    else:
        slicedchunks = deltautil.slicechunk(
            self,
            fetched_revs,
            targetsize=targetsize,
        )

    for revschunk in slicedchunks:
        firstrev = revschunk[0]
        # Skip trailing revisions with empty diff
        for lastrev in revschunk[::-1]:
            if length(lastrev) != 0:
                break

        try:
            offset, data = self.get_segment_for_revs(firstrev, lastrev)
        except OverflowError:
            # issue4215 - we can't cache a run of chunks greater than
            # 2G on Windows
            for rev in revschunk:
                ladd((rev, self._chunk(rev)))
            # This slice is fully handled.  Without skipping to the next
            # one, the loop below would run with `offset` and `data`
            # unbound (or left over from the previous slice).
            continue

        decomp = self.decompress
        # self._decompressor might be None, but will not be used in that case
        def_decomp = self._decompressor
        for rev in revschunk:
            chunkstart = start(rev)
            if inline:
                chunkstart += (rev + 1) * iosize
            chunklength = length(rev)
            comp_mode = self.index[rev][10]
            c = buffer(data, chunkstart - offset, chunklength)
            if comp_mode == COMP_MODE_PLAIN:
                pass  # stored uncompressed, use the buffer as is
            elif comp_mode == COMP_MODE_INLINE:
                c = decomp(c)
            elif comp_mode == COMP_MODE_DEFAULT:
                c = def_decomp(c)
            else:
                msg = b'unknown compression mode %d'
                msg %= comp_mode
                raise error.RevlogError(msg)
            ladd((rev, c))
            if self._uncompressed_chunk_cache is not None:
                self._uncompressed_chunk_cache.insert(rev, c, len(c))

    # Cached and fetched chunks were collected separately: restore revision
    # order.  Sorting on the revision alone never compares chunk payloads,
    # which may be buffer objects that do not support ordering.
    chunks.sort(key=lambda item: item[0])
    return [x[1] for x in chunks]

993

994

def raw_text(self, node, rev):
    """return the possibly unvalidated rawtext for a revision

    The delta chain of ``rev`` is walked, stopping early at the revision
    held in ``self._revisioncache`` (if any) so its text can serve as the
    base the remaining deltas are applied to.  ``node`` is not used by
    this method.

    The revision cache is cleared as a side effect.

    returns (rev, rawtext, validated), where ``validated`` is always False
    """
    # The cache entry looks like (node, rev, rawtext); its revision could
    # be useful as a starting point to apply deltas.
    stop_at = self._revisioncache[1] if self._revisioncache else None

    chain, stopped = self._deltachain(rev, stoprev=stop_at)
    # An intermediate text to apply deltas to
    base = self._revisioncache[2] if stopped else None

    # drop cache to save memory, the caller is expected to
    # update self._inner._revisioncache after validating the text
    self._revisioncache = None

    rawsize = self.index[rev][2]
    targetsize = 4 * rawsize if 0 <= rawsize else None

    chunk_cache = self._uncompressed_chunk_cache
    if chunk_cache is not None:
        # dynamically update the uncompressed_chunk_cache size to the
        # largest revision we saw in this revlog.
        wanted = rawsize * self.data_config.uncompressed_cache_factor
        if wanted > chunk_cache.maxcost:
            chunk_cache.maxcost = wanted

    deltas = self._chunks(chain, targetsize=targetsize)
    if base is None:
        # no cached text to start from: the first chunk is the full text
        base = bytes(deltas[0])
        deltas = deltas[1:]

    rawtext = mdiff.patches(base, deltas)
    del base  # let us have a chance to free memory early
    return (rev, rawtext, False)

1039

1040

def sidedata(self, rev, sidedata_end):
    """Return the deserialized sidedata stored for revision ``rev``.

    The offset and size of the sidedata segment are read from fields 8 and
    9 of the index entry.  An empty dict is returned when the recorded size
    is zero.

    ``sidedata_end`` is the offset the segment must not extend past; a
    ``RevlogError`` is raised when ``offset + size`` is larger than it, or
    when the compression mode found in field 11 of the index entry is not
    one of the known ``COMP_MODE_*`` values.
    """
    entry = self.index[rev]
    start, size = entry[8], entry[9]

    if self.inline:
        # inline revlog: add the size of ``rev + 1`` index entries to the
        # recorded offset
        start += self.index.entry_size * (1 + rev)
    if size == 0:
        return {}

    if sidedata_end < start + size:
        raise error.RevlogError(
            FILE_TOO_SHORT_MSG
            % (self.sidedata_file, size, start, sidedata_end)
        )

    raw = self._segmentfile_sidedata.read_chunk(start, size)

    mode = self.index[rev][11]
    if mode == COMP_MODE_PLAIN:
        payload = raw
    elif mode == COMP_MODE_DEFAULT:
        payload = self._decompressor(raw)
    elif mode == COMP_MODE_INLINE:
        payload = self.decompress(raw)
    else:
        raise error.RevlogError(b'unknown compression mode %d' % mode)

    return sidedatautil.deserialize_sidedata(payload)

1077

1078

def write_entry(
    self,
    transaction,
    entry,
    data,
    link,
    offset,
    sidedata,
    sidedata_offset,
    index_end,
    data_end,
    sidedata_end,
):
    """Write one revision (index entry, data and sidedata) to disk.

    ``entry`` is the packed index entry, ``data`` a 2-item sequence whose
    items are written one after the other, and ``sidedata`` the optional
    sidedata payload.  ``offset`` and ``sidedata_offset`` are the
    positions registered with ``transaction`` for the data and sidedata
    files.  ``index_end`` and ``data_end`` are where the index and data
    handles are positioned before writing (``None`` means the end of the
    file); the sidedata handle, when there is one, is positioned at
    ``sidedata_end``.  ``link`` is not used here.

    Returns a 3-tuple with the ``tell()`` position of the index, data and
    sidedata handles after the write; the last two are ``None`` when the
    corresponding handle is falsy.

    Raises ``ProgrammingError`` when no writing handles are open, or when
    a delayed write is requested on an inline revlog.
    """
    # Why every handle is explicitly positioned before writing:
    #
    # Files opened in a+ mode behave inconsistently across platforms.
    # Windows requires a file positioning call when a handle switches
    # between reads and writes (see 3686fa2b8eee and the
    # mixedfilemodewrapper in windows.py).  Elsewhere, Python or the
    # platform itself can be buggy: some versions of Solaris have been
    # observed not to append at the end of the file if it was seeked to
    # before the end (see issue4943).
    #
    # This is likely unnecessary on Python 3, but since the handle is also
    # used for reads and may have been seeked, be careful before changing
    # it.
    handles = self._writinghandles
    if handles is None:
        raise error.ProgrammingError(
            b'adding revision outside `revlog._writing` context'
        )
    ifh, dfh, sdfh = handles

    if index_end is not None:
        ifh.seek(index_end, os.SEEK_SET)
    else:
        ifh.seek(0, os.SEEK_END)
    if dfh:
        if data_end is not None:
            dfh.seek(data_end, os.SEEK_SET)
        else:
            dfh.seek(0, os.SEEK_END)
    if sdfh:
        sdfh.seek(sidedata_end, os.SEEK_SET)

    last = len(self.index) - 1
    if self.inline:
        if self._delay_buffer is not None:
            raise error.ProgrammingError(
                b'invalid delayed write on inline revlog'
            )
        # index entries and data share one file: shift the registered
        # offset by the size of ``last`` index entries
        offset += last * self.index.entry_size
        transaction.add(self.canonical_index_file, offset)
        assert not sidedata
        ifh.write(entry)
        ifh.write(data[0])
        ifh.write(data[1])
    else:
        transaction.add(self.data_file, offset)
        if self.sidedata_file:
            transaction.add(self.sidedata_file, sidedata_offset)
        transaction.add(self.canonical_index_file, last * len(entry))

        header = data[0]
        if header:
            dfh.write(header)
        dfh.write(data[1])
        if sidedata:
            sdfh.write(sidedata)

        pending = self._delay_buffer
        if pending is None:
            ifh.write(entry)
        else:
            # index writes are being delayed: buffer the entry instead
            pending.append(entry)

    data_pos = dfh.tell() if dfh else None
    sidedata_pos = sdfh.tell() if sdfh else None
    return (ifh.tell(), data_pos, sidedata_pos)

1149

1150

def _divert_index(self):

1150

def _divert_index(self):

1151

return self.index_file + b'.a'

1151

return self.index_file + b'.a'

1152

1153

def delay(self):
    """Start delaying (or diverting) writes to the index file.

    Nothing is changed when a delay buffer or a diverted index is already
    in place.  Otherwise, an empty index is diverted: the current index
    file name is remembered, ``index_file`` is switched to the name given
    by ``_divert_index()``, and any existing file of that name is removed.
    A non-empty index gets a fresh delay buffer instead.

    Returns the diverted index file name when a divert was set up, and
    ``None`` in every other case.  Raises ``ProgrammingError`` on an inline
    revlog.
    """
    assert not self.is_open
    if self.inline:
        raise error.ProgrammingError(
            "revlog with delayed write should not be inline"
        )

    nothing_in_place = (
        self._delay_buffer is None and self._orig_index_file is None
    )
    if not nothing_in_place:
        # delay or divert already in place
        return None

    if len(self.index) != 0:
        # existing content: buffer the new index entries
        self._delay_buffer = []
        return None

    # empty index: write to a diverted file instead
    self._orig_index_file = self.index_file
    self.index_file = self._divert_index()
    assert self._orig_index_file is not None
    assert self.index_file is not None
    if self.opener.exists(self.index_file):
        self.opener.unlink(self.index_file)
    return self.index_file

1172

1173

def write_pending(self):
    """Expose the current index content through a diverted index file.

    When the index is already diverted, nothing is written and
    ``(None, True)`` is returned.

    Otherwise the index file is copied to the name given by
    ``_divert_index()`` (replacing any existing file of that name), the
    buffered index entries, if any, are appended to that copy, the delay
    buffer is dropped, and the revlog switches to the copy while
    remembering the original index file name.

    Returns ``(index_file, any_pending)`` where ``any_pending`` tells
    whether buffered entries were written.  Raises ``ProgrammingError`` on
    an inline revlog.
    """
    assert not self.is_open
    if self.inline:
        raise error.ProgrammingError(
            "revlog with delayed write should not be inline"
        )
    if self._orig_index_file is not None:
        return None, True

    target = self._divert_index()
    if self.opener.exists(target):
        self.opener.unlink(target)
    source_path = self.opener.join(self.index_file)
    target_path = self.opener.join(target)
    util.copyfile(source_path, target_path)

    wrote_entries = False
    if self._delay_buffer:
        with self.opener(target, b'r+') as ifh:
            ifh.seek(0, os.SEEK_END)
            ifh.write(b"".join(self._delay_buffer))
        wrote_entries = True

    self._delay_buffer = None
    self._orig_index_file = self.index_file
    self.index_file = target
    return self.index_file, wrote_entries

1197

1198

def finalize_pending(self):
    """Finish a delayed or diverted index write.

    With a delay buffer in place, the buffered entries (if any) are
    appended to the index file and the buffer is dropped.  With a diverted
    index, the diverted file (if it exists) is renamed onto the original
    index file name and the revlog switches back to that name.

    Returns ``canonical_index_file``.  Raises ``ProgrammingError`` on an
    inline revlog, or when neither a delay nor a divert is in place.
    """
    assert not self.is_open
    if self.inline:
        raise error.ProgrammingError(
            "revlog with delayed write should not be inline"
        )

    delayed = self._delay_buffer is not None
    diverted = self._orig_index_file is not None

    if delayed and diverted:
        assert False, "unreachable"
    elif not delayed and not diverted:
        raise error.ProgrammingError(
            b"not delay or divert found on this revlog"
        )
    elif delayed:
        buffered = self._delay_buffer
        if buffered:
            with self.opener(self.index_file, b'r+') as ifh:
                ifh.seek(0, os.SEEK_END)
                ifh.write(b"".join(buffered))
        self._delay_buffer = None
    else:
        # diverted: move the diverted file back under the original name
        if self.opener.exists(self.index_file):
            self.opener.rename(
                self.index_file,
                self._orig_index_file,
                checkambig=True,
            )
        self.index_file = self._orig_index_file
        self._orig_index_file = None
    return self.canonical_index_file

1228

1229

1230

class revlog:

1230

class revlog:

1231

"""

1231

"""

1232

the underlying revision storage object

1232

the underlying revision storage object

1233

1234

A revlog consists of two parts, an index and the revision data.

1234

A revlog consists of two parts, an index and the revision data.

1235

1236

The index is a file with a fixed record size containing

1236

The index is a file with a fixed record size containing

1237

information on each revision, including its nodeid (hash), the

1237

information on each revision, including its nodeid (hash), the

1238

nodeids of its parents, the position and offset of its data within

1238

nodeids of its parents, the position and offset of its data within

1239

the data file, and the revision it's based on. Finally, each entry

1239

the data file, and the revision it's based on. Finally, each entry

1240

contains a linkrev entry that can serve as a pointer to external

1240

contains a linkrev entry that can serve as a pointer to external

1241

data.

1241

data.

1242

1243

The revision data itself is a linear collection of data chunks.

1243

The revision data itself is a linear collection of data chunks.

1244

Each chunk represents a revision and is usually represented as a

1244

Each chunk represents a revision and is usually represented as a

1245

delta against the previous chunk. To bound lookup time, runs of

1245

delta against the previous chunk. To bound lookup time, runs of

1246

deltas are limited to about 2 times the length of the original

1246

deltas are limited to about 2 times the length of the original

1247

version data. This makes retrieval of a version proportional to

1247

version data. This makes retrieval of a version proportional to

1248

its size, or O(1) relative to the number of revisions.

1248

its size, or O(1) relative to the number of revisions.

1249

1250

Both pieces of the revlog are written to in an append-only

1250

Both pieces of the revlog are written to in an append-only

1251

fashion, which means we never need to rewrite a file to insert or

1251

fashion, which means we never need to rewrite a file to insert or

1252

remove data, and can use some simple techniques to avoid the need

1252

remove data, and can use some simple techniques to avoid the need

1253

for locking while reading.

1253

for locking while reading.

1254

1255

If checkambig, indexfile is opened with checkambig=True at

1255

If checkambig, indexfile is opened with checkambig=True at

1256

writing, to avoid file stat ambiguity.

1256

writing, to avoid file stat ambiguity.

1257

1258

If mmaplargeindex is True, and an mmapindexthreshold is set, the

1258

If mmaplargeindex is True, and an mmapindexthreshold is set, the

1259

index will be mmapped rather than read if it is larger than the

1259

index will be mmapped rather than read if it is larger than the

1260

configured threshold.

1260

configured threshold.

1261

1262

If censorable is True, the revlog can have censored revisions.

1262

If censorable is True, the revlog can have censored revisions.

1263

1264

If `upperboundcomp` is not None, this is the expected maximal gain from

1264

If `upperboundcomp` is not None, this is the expected maximal gain from

1265

compression for the data content.

1265

compression for the data content.

1266

1267

`concurrencychecker` is an optional function that receives 3 arguments: a

1267

`concurrencychecker` is an optional function that receives 3 arguments: a

1268

file handle, a filename, and an expected position. It should check whether

1268

file handle, a filename, and an expected position. It should check whether

1269

the current position in the file handle is valid, and log/warn/fail (by

1269

the current position in the file handle is valid, and log/warn/fail (by

1270

raising).

1270

raising).

1271

1272

See mercurial/revlogutils/constants.py for details about the content of an

1272

See mercurial/revlogutils/constants.py for details about the content of an

1273

index entry.

1273

index entry.

1274

"""

1274

"""

1275

1276

_flagserrorclass = error.RevlogError

1276

_flagserrorclass = error.RevlogError

1277

1278

@staticmethod
def is_inline_index(header_bytes):
    """Tell whether an index starting with ``header_bytes`` is inline.

    An empty ``header_bytes`` is reported as inline.  Otherwise the header
    is unpacked with ``INDEX_HEADER``; its low 16 bits select the format
    version and the remaining bits are the format flags handed to that
    version's ``b'inline'`` feature check.
    """
    if not len(header_bytes):
        return True

    header = INDEX_HEADER.unpack(header_bytes)[0]

    version = header & 0xFFFF
    flags = header & ~0xFFFF

    inline_check = FEATURES_BY_VERSION[version][b'inline']
    return inline_check(flags)

1291

1292

def __init__(
    self,
    opener,
    target,
    radix,
    postfix=None,  # only exist for `tmpcensored` now
    checkambig=False,
    mmaplargeindex=False,
    censorable=False,
    upperboundcomp=None,
    persistentnodemap=False,
    concurrencychecker=None,
    trypending=False,
    try_split=False,
    canonical_parent_order=True,
    data_config=None,
    delta_config=None,
    feature_config=None,
    may_inline=True,  # may inline new revlog
):
    """
    Create a revlog object.

    `opener` is a function that abstracts the file opening operation
    and can be used to implement COW semantics or the like.

    `target`: a (KIND, ID) tuple that identifies the content stored in
    this revlog. It helps the rest of the code to understand what the
    revlog is about without having to resort to heuristics and index
    filename analysis. Note that this must reliably be set by normal code,
    but that test, debug, or performance measurement code might not set
    this to an accurate value.

    `feature_config`, `data_config` and `delta_config`: when given, a copy
    of the object is used. Otherwise the matching `b'feature-config'`,
    `b'data-config'` or `b'delta-config'` entry of `opener.options` is
    copied when present, and a fresh default config object is created when
    it is not. In all cases the values of `censorable`,
    `canonical_parent_order`, `checkambig`, `mmaplargeindex` and
    `upperboundcomp` are then stored on the resulting config objects.
    """

    self.radix = radix

    # file names start unset
    self._docket_file = None
    self._indexfile = None
    self._datafile = None
    self._sidedatafile = None
    self._nodemap_file = None
    self.postfix = postfix
    self._trypending = trypending
    self._try_split = try_split
    self._may_inline = may_inline
    self.opener = opener
    if persistentnodemap:
        self._nodemap_file = nodemaputil.get_nodemap_file(self)

    assert target[0] in ALL_KINDS
    assert len(target) == 2
    self.target = target
    # feature config: explicit argument, then opener options, then default
    if feature_config is not None:
        self.feature_config = feature_config.copy()
    elif b'feature-config' in self.opener.options:
        self.feature_config = self.opener.options[b'feature-config'].copy()
    else:
        self.feature_config = FeatureConfig()
    self.feature_config.censorable = censorable
    self.feature_config.canonical_parent_order = canonical_parent_order
    # data config: same lookup order as the feature config
    if data_config is not None:
        self.data_config = data_config.copy()
    elif b'data-config' in self.opener.options:
        self.data_config = self.opener.options[b'data-config'].copy()
    else:
        self.data_config = DataConfig()
    self.data_config.check_ambig = checkambig
    self.data_config.mmap_large_index = mmaplargeindex
    # delta config: same lookup order as the feature config
    if delta_config is not None:
        self.delta_config = delta_config.copy()
    elif b'delta-config' in self.opener.options:
        self.delta_config = self.opener.options[b'delta-config'].copy()
    else:
        self.delta_config = DeltaConfig()
    self.delta_config.upper_bound_comp = upperboundcomp

    # Maps rev to chain base rev.
    self._chainbasecache = util.lrucachedict(100)

    self.index = None
    self._docket = None
    self._nodemap_docket = None
    # Mapping of partial identifiers to full nodes.
    self._pcache = {}

    # other optional features

    # Make copy of flag processors so each revlog instance can support
    # custom flags.
    self._flagprocessors = dict(flagutil.flagprocessors)
    # prevent nesting of addgroup
    self._adding_group = None

    # load the index, then hand the value `_loadindex()` returned to
    # `_load_inner()`
    chunk_cache = self._loadindex()
    self._load_inner(chunk_cache)
    self._concurrencychecker = concurrencychecker

1388

1389

def _init_opts(self):
    """Turn the opener options into the default settings of this revlog.

    These values might be affected when actually reading on disk
    information.

    As side effects, ``feature_config.compute_rank`` is set when the
    changelog-v2 format is selected, and the ellipsis and option-provided
    flag processors are registered in ``self._flagprocessors``.

    A ``RevlogError`` is raised when the configured chunk cache size is
    not greater than 0 or is not a power of 2.

    Returns a 3-tuple for use in _loadindex():

    * new_header:
        version header to use if we need to create a new revlog

    * mmapindexthreshold:
        minimal index size to start using mmap, or None when
        ``data_config.mmap_large_index`` is not set

    * force_nodemap:
        force the usage of a "development" version of the nodemap code
    """
    opts = self.opener.options

    # pick the header for a newly created revlog
    if b'changelogv2' in opts and self.revlog_kind == KIND_CHANGELOG:
        new_header = CHANGELOGV2
        self.feature_config.compute_rank = opts.get(
            b'changelogv2.compute-rank', True
        )
    elif b'revlogv2' in opts:
        new_header = REVLOGV2
    elif b'revlogv1' in opts:
        new_header = REVLOGV1
        if self._may_inline:
            new_header |= FLAG_INLINE_DATA
        if b'generaldelta' in opts:
            new_header |= FLAG_GENERALDELTA
    elif b'revlogv0' in self.opener.options:
        new_header = REVLOGV0
    else:
        new_header = REVLOG_DEFAULT_VERSION

    if self.data_config.mmap_large_index:
        mmapindexthreshold = self.data_config.mmap_index_threshold
    else:
        mmapindexthreshold = None
    if self.feature_config.enable_ellipsis:
        self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

    # revlog v0 doesn't have flag processors
    extra_processors = opts.get(b'flagprocessors', {})
    for flag, processor in extra_processors.items():
        flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

    cache_size = self.data_config.chunk_cache_size
    if cache_size <= 0:
        raise error.RevlogError(
            _(b'revlog chunk cache size %r is not greater than 0')
            % cache_size
        )
    if cache_size & (cache_size - 1):
        # more than one bit set
        raise error.RevlogError(
            _(b'revlog chunk cache size %r is not a power of 2')
            % cache_size
        )

    force_nodemap = opts.get(b'devel-force-nodemap', False)
    return new_header, mmapindexthreshold, force_nodemap

1447

1448

def _get_data(self, filepath, mmap_threshold, size=None):

1448

def _get_data(self, filepath, mmap_threshold, size=None):

1449

"""return a file content with or without mmap

1449

"""return a file content with or without mmap

1450

1451

If the file is missing return the empty string"""

1451

If the file is missing return the empty string"""

1452

try:

1452

try:

1453

with self.opener(filepath) as fp:

1453

with self.opener(filepath) as fp:

1454

if mmap_threshold is not None:

1454

if mmap_threshold is not None:

1455

file_size = self.opener.fstat(fp).st_size

1455

file_size = self.opener.fstat(fp).st_size

1456

if file_size >= mmap_threshold:

1456

if file_size >= mmap_threshold:

1457

if size is not None:

1457

if size is not None:

1458

# avoid potentiel mmap crash

1458

# avoid potentiel mmap crash

1459

size = min(file_size, size)

1459

size = min(file_size, size)

1460

# TODO: should .close() to release resources without

1460

# TODO: should .close() to release resources without

1461

# relying on Python GC

1461

# relying on Python GC

1462

if size is None:

1462

if size is None:

1463

return util.buffer(util.mmapread(fp))

1463

return util.buffer(util.mmapread(fp))

1464

else:

1464

else:

1465

return util.buffer(util.mmapread(fp, size))

1465

return util.buffer(util.mmapread(fp, size))

1466

if size is None:

1466

if size is None:

1467

return fp.read()

1467

return fp.read()

1468

else:

1468

else:

1469

return fp.read(size)

1469

return fp.read(size)

1470

except FileNotFoundError:

1470

except FileNotFoundError:

1471

return b''

1471

return b''

1472

1473

def get_streams(self, max_linkrev, force_inline=False):
    """Return a list of streams that represent this revlog.

    This is used by stream-clone to do bytes to bytes copies of a
    repository.

    Trailing revisions are dropped until the last remaining one has a
    linkrev lower than `max_linkrev`; only the remaining revisions are
    streamed.

    If `force_inline` is set, it enforces that the stream will represent an
    inline revlog.

    The return value is a list of three-tuples:

        [
            (filename, bytes_stream, stream_size),
            ...
        ]

    An empty list is returned when there is nothing to send.
    """
    index = self.index
    n = len(self)
    # note: this loop will rarely go through multiple iterations, since
    # it only traverses commits created during the current streaming
    # pull operation.
    #
    # If this becomes a problem, using a binary search should cap the
    # runtime of this.
    while n > 0 and index[n - 1][4] >= max_linkrev:
        n -= 1
    if n == 0:
        # no data to send
        return []
    index_size = n * index.entry_size
    data_size = self.end(n - 1)

    def file_chunks(fp, size):
        """yield `size` bytes of `fp`, in one read when small enough"""
        if size <= 65536:
            yield fp.read(size)
        else:
            yield from util.filechunkiter(fp, limit=size)

    def primed(stream):
        """advance `stream` to its first `yield None` and return it

        Every generator below yields None right after acquiring its
        file or reading context, so priming acquires it immediately.
        """
        next(stream)
        return stream

    # XXX we might have been split (or stripped) since the object
    # initialization, We need to close this race too, but having a way to
    # pre-open the file we feed to the revlog and never closing them before
    # we are done streaming.

    if self._inline:
        total_size = index_size + data_size

        def inline_chunks():
            with self.opener(self._indexfile, mode=b"r") as fp:
                yield None
                yield from file_chunks(fp, total_size)

        return [
            (self._indexfile, primed(inline_chunks()), total_size),
        ]

    if force_inline:

        def rebuilt_inline_chunks():
            with self.reading():
                yield None

                for rev in range(n):
                    idx = self.index.entry_binary(rev)
                    if rev == 0 and self._docket is None:
                        # re-inject the inline flag
                        header = (
                            self._format_flags
                            | self._format_version
                            | FLAG_INLINE_DATA
                        )
                        idx = self.index.pack_header(header) + idx
                    yield idx
                    yield self._inner.get_segment_for_revs(rev, rev)[1]

        return [
            (
                self._indexfile,
                primed(rebuilt_inline_chunks()),
                index_size + data_size,
            ),
        ]

    def index_chunks():
        with self.opener(self._indexfile, mode=b"r") as fp:
            yield None
            yield from file_chunks(fp, index_size)

    def data_chunks():
        with self._datafp() as fp:
            yield None
            yield from file_chunks(fp, data_size)

    # the index file is opened before the data file, but the data stream
    # is listed first
    index_stream = primed(index_chunks())
    data_stream = primed(data_chunks())
    return [
        (self._datafile, data_stream, data_size),
        (self._indexfile, index_stream, index_size),
    ]

1579

1580

def _loadindex(self, docket=None):
    """Read the revlog entry point, parse the index and set related state.

    When `docket` is provided it is used as-is and the entry point file is
    not read.  Otherwise the header of the entry point file (or the default
    header for a new revlog) determines the format version and flags, and
    from them the features in use.

    Sets, among others, `self.index`, `self._indexfile`, `self._datafile`,
    `self._inline` and `self._parse_index`.

    Returns the chunk cache produced by the index parser.  Raises
    `error.RevlogError` on an unknown version, unknown flags, truncated
    index data or a corrupted index.
    """
    new_header, mmapindexthreshold, force_nodemap = self._init_opts()

    # select the file acting as entry point for this revlog
    if self.postfix is not None:
        entry_point = b'%s.i.%s' % (self.radix, self.postfix)
    elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
        entry_point = b'%s.i.a' % self.radix
    elif self._try_split and self.opener.exists(self._split_index_file):
        entry_point = self._split_index_file
    else:
        entry_point = b'%s.i' % self.radix

    if docket is not None:
        self._docket = docket
        self._docket_file = entry_point
    else:
        self._initempty = True
        entry_data = self._get_data(entry_point, mmapindexthreshold)
        if len(entry_data) > 0:
            header = INDEX_HEADER.unpack(entry_data[:4])[0]
            self._initempty = False
        else:
            header = new_header

        # low 16 bits: format version, remaining bits: format flags
        self._format_flags = header & ~0xFFFF
        self._format_version = header & 0xFFFF

        supported_flags = SUPPORTED_FLAGS.get(self._format_version)
        if supported_flags is None:
            msg = _(b'unknown version (%d) in revlog %s')
            msg %= (self._format_version, self.display_id)
            raise error.RevlogError(msg)
        elif self._format_flags & ~supported_flags:
            msg = _(b'unknown flags (%#04x) in version %d revlog %s')
            display_flag = self._format_flags >> 16
            msg %= (display_flag, self._format_version, self.display_id)
            raise error.RevlogError(msg)

        features = FEATURES_BY_VERSION[self._format_version]
        self._inline = features[b'inline'](self._format_flags)
        self.delta_config.general_delta = features[b'generaldelta'](
            self._format_flags
        )
        self.feature_config.has_side_data = features[b'sidedata']

        if features[b'docket']:
            self._docket_file = entry_point
            if self._initempty:
                self._docket = docketutil.default_docket(self, header)
            else:
                self._docket = docketutil.parse_docket(
                    self, entry_data, use_pending=self._trypending
                )
        else:
            self._indexfile = entry_point
            index_data = entry_data

    if self._docket is not None:
        # the docket points to the actual index file and says how much
        # of it is valid
        self._indexfile = self._docket.index_filepath()
        index_data = b''
        index_size = self._docket.index_end
        if index_size > 0:
            index_data = self._get_data(
                self._indexfile, mmapindexthreshold, size=index_size
            )
            if len(index_data) < index_size:
                msg = _(b'too few index data for %s: got %d, expected %d')
                msg %= (self.display_id, len(index_data), index_size)
                raise error.RevlogError(msg)

        self._inline = False
        # generaldelta implied by version 2 revlogs.
        self.delta_config.general_delta = True
        # the logic for persistent nodemap will be dealt with within the
        # main docket, so disable it for now.
        self._nodemap_file = None

    active_docket = self._docket
    if active_docket is not None:
        self._datafile = active_docket.data_filepath()
        self._sidedatafile = active_docket.sidedata_filepath()
    elif self.postfix is None:
        self._datafile = b'%s.d' % self.radix
    else:
        self._datafile = b'%s.d.%s' % (self.radix, self.postfix)

    self.nodeconstants = sha1nodeconstants
    self.nullid = self.nodeconstants.nullid

    # sparse-revlog can't be on without general-delta (issue6056)
    if not self.delta_config.general_delta:
        self.delta_config.sparse_revlog = False

    self._storedeltachains = True

    devel_nodemap = (
        self._nodemap_file
        and force_nodemap
        and parse_index_v1_nodemap is not None
    )

    # Using the CIndex is no longer possible when the Rust extensions are
    # available, as the `AncestorsIterator` and `LazyAncestors` classes
    # now require a Rust index for instantiation.  The Rust index is thus
    # used whether or not a nodemap file is configured.
    use_rust_index = rustrevlog is not None

    # pick the index parser; the version specific parsers take
    # precedence over the nodemap/Rust variants of the v1 parser
    if self._format_version == REVLOGV0:
        parser = revlogv0.parse_index_v0
    elif self._format_version == REVLOGV2:
        parser = parse_index_v2
    elif self._format_version == CHANGELOGV2:
        parser = parse_index_cl_v2
    elif devel_nodemap:
        parser = parse_index_v1_nodemap
    elif use_rust_index:
        parser = functools.partial(
            parse_index_v1_rust, default_header=new_header
        )
    else:
        parser = parse_index_v1
    self._parse_index = parser

    try:
        index, chunkcache = self._parse_index(index_data, self._inline)
        use_nodemap = (
            not self._inline
            and self._nodemap_file is not None
            and hasattr(index, 'update_nodemap_data')
        )
        if use_nodemap:
            nodemap_data = nodemaputil.persisted_data(self)
            if nodemap_data is not None:
                nodemap_docket = nodemap_data[0]
                tip_rev = nodemap_docket.tip_rev
                if (
                    len(index) > tip_rev
                    and index[tip_rev][7] == nodemap_docket.tip_node
                ):
                    # no changelog tampering
                    self._nodemap_docket = nodemap_docket
                    index.update_nodemap_data(*nodemap_data)
    except (ValueError, IndexError):
        raise error.RevlogError(
            _(b"index %s is corrupted") % self.display_id
        )
    self.index = index
    # revnum -> (chain-length, sum-delta-length)
    self._chaininfocache = util.lrucachedict(500)

    return chunkcache

1732

1733

def _load_inner(self, chunk_cache):
    """Build `self._inner`, the `_InnerRevlog` backing this revlog.

    The default compression header is taken from the docket when there is
    one, and is None otherwise.
    """
    docket = self._docket
    default_compression_header = (
        None if docket is None else docket.default_compression_header
    )

    self._inner = _InnerRevlog(
        opener=self.opener,
        index=self.index,
        index_file=self._indexfile,
        data_file=self._datafile,
        sidedata_file=self._sidedatafile,
        inline=self._inline,
        data_config=self.data_config,
        delta_config=self.delta_config,
        feature_config=self.feature_config,
        chunk_cache=chunk_cache,
        default_compression_header=default_compression_header,
    )

1752

1753

def get_revlog(self):
    """Return this object itself.

    Simple function to mirror the API of other not-really-revlog objects.
    """
    revlog = self
    return revlog

1756

1757

@util.propertycache
def revlog_kind(self):
    """The kind of this revlog: the first item of `self.target`."""
    kind = self.target[0]
    return kind

1760

1761

@util.propertycache
def display_id(self):
    """The public facing "ID" of the revlog that we use in message"""
    if self.revlog_kind != KIND_FILELOG:
        return self.radix
    # For filelogs, reference the file without the "data/" prefix, so it
    # is familiar to the user.
    return self.target[1]

1770

1771

def _datafp(self, mode=b'r'):
    """Open the revlog's data file with `mode` and return the file object."""
    opener = self.opener
    return opener(self._datafile, mode=mode)

1774

1775

def tiprev(self):
    """Return the number of the last revision (-1 for an empty index)."""
    revision_count = len(self.index)
    return revision_count - 1

1777

1778

def tip(self):
    """Return the node of the revision reported by `tiprev()`."""
    last_rev = self.tiprev()
    return self.node(last_rev)

1780

1781

def __contains__(self, rev):
    """Tell whether `rev` is a valid revision number for this revlog."""
    upper_bound = len(self)
    return 0 <= rev < upper_bound

1783

1784

def __len__(self):
    """Return the number of entries in the index."""
    index = self.index
    return len(index)

1786

1787

def __iter__(self):
    """Iterate over every revision number, from 0 to `len(self) - 1`."""
    revision_count = len(self)
    return iter(range(revision_count))

1789

1790

def revs(self, start=0, stop=None):
    """iterate over all rev in this revlog (from start to stop)

    The iteration itself is delegated to `storageutil.iterrevs`.
    """
    revision_count = len(self)
    return storageutil.iterrevs(revision_count, start=start, stop=stop)

1793

1794

def hasnode(self, node):
    """Tell whether `node` can be resolved to a revision by `self.rev`.

    A `KeyError` raised by the lookup is interpreted as "unknown node".
    """
    try:
        self.rev(node)
    except KeyError:
        return False
    return True

1800

1801

def _candelta(self, baserev, rev):
    """whether two revisions (baserev, rev) can be delta-ed or not"""
    # Disable delta if either rev requires a content-changing flag
    # processor (ex. LFS). This is because such flag processor can alter
    # the rawtext content that the delta will be based on, and two clients
    # could have a same revlog node with different flags (i.e. different
    # rawtext contents) and the delta could be incompatible.
    base_changes_rawtext = self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS
    if base_changes_rawtext:
        return False
    rev_changes_rawtext = self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS
    return not rev_changes_rawtext

1813

1814

def update_caches(self, transaction):
    """update on disk cache

    Nothing happens when no nodemap file is configured.  Without a
    transaction the persistent nodemap is updated right away; if a
    transaction is passed, the update may be delayed to transaction
    commit.
    """
    if self._nodemap_file is None:
        return
    if transaction is None:
        nodemaputil.update_persistent_nodemap(self)
    else:
        nodemaputil.setup_persistent_nodemap(transaction, self)

1824

1825

def clearcaches(self):
    """Clear in-memory caches"""
    self._chainbasecache.clear()
    self._inner.clear_cache()
    self._pcache = {}
    self._nodemap_docket = None
    self.index.clearcaches()

    # The python code is the one responsible for validating the docket, we
    # end up having to refresh it here.
    if self._inline or self._nodemap_file is None:
        return
    if not hasattr(self.index, 'update_nodemap_data'):
        return
    nodemap_data = nodemaputil.persisted_data(self)
    if nodemap_data is None:
        return
    self._nodemap_docket = nodemap_data[0]
    self.index.update_nodemap_data(*nodemap_data)

1844

1845

def rev(self, node):
    """return the revision number associated with a <nodeid>

    A `TypeError` from the index lookup is propagated unchanged.  When the
    lookup fails with `error.RevlogError`, `error.WdirUnsupported` is
    raised for working directory pseudo-nodes and `error.LookupError` for
    any other node.
    """
    try:
        return self.index.rev(node)
    except TypeError:
        raise
    except error.RevlogError:
        # parsers.c radix tree lookup failed
        is_wdir_node = (
            node == self.nodeconstants.wdirid
            or node in self.nodeconstants.wdirfilenodeids
        )
        if is_wdir_node:
            raise error.WdirUnsupported
        raise error.LookupError(node, self.display_id, _(b'no node'))

1859

1860

# Accessors for index entries.

1860

# Accessors for index entries.

1861

1862

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

1862

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

1863

# are flags.

1863

# are flags.

1864

def start(self, rev):
    """Return the offset stored for `rev`.

    The first index field packs the offset above 16 bits of flags, so the
    flags are shifted out.
    """
    offset_and_flags = self.index[rev][0]
    return int(offset_and_flags >> 16)

1866

1867

def sidedata_cut_off(self, rev):
    """Return the sidedata offset associated with `rev`.

    The offset recorded for `rev` (index field 8) is returned when it is
    not zero.  Otherwise the end (offset + length, fields 8 and 9) of the
    closest revision at or before `rev` with a non-zero sidedata length is
    returned, or 0 when there is none.
    """
    index = self.index
    recorded = index[rev][8]
    if recorded != 0:
        return recorded
    # This is some annoying dance, because entries without sidedata
    # currently use 0 as their offset. (instead of previous-offset +
    # previous-size)
    #
    # We should reconsider this sidedata → 0 sidedata_offset policy.
    # In the meantime, we need this.
    for candidate in range(rev, -1, -1):
        entry = index[candidate]
        if entry[9] != 0:
            return entry[8] + entry[9]
    return 0

1883

1884

def flags(self, rev):
    """Return the flags of `rev`: the low 16 bits of the first index field."""
    offset_and_flags = self.index[rev][0]
    return offset_and_flags & 0xFFFF

1886

1887

def length(self, rev):
    """Return the second index field of `rev`.

    `end()` adds this value to `start()`, so it is presumably the stored
    size of the revision.
    """
    entry = self.index[rev]
    return entry[1]

1889

1890

def sidedata_length(self, rev):
    """Return the sidedata length recorded for `rev` (index field 9).

    Always 0 when the revlog has no sidedata support.
    """
    if self.feature_config.has_side_data:
        return self.index[rev][9]
    return 0

1894

1895

def rawsize(self, rev):
    """return the length of the uncompressed text for a given revision

    The size stored in the index (field 2) is used when it is not
    negative; otherwise the raw data is fetched and measured.
    """
    stored = self.index[rev][2]
    if stored < 0:
        return len(self.rawdata(rev))
    return stored

1903

1904

def size(self, rev):
    """length of non-raw text (processed by a "read" flag processor)"""
    rev_flags = self.flags(rev)
    # note: ELLIPSIS is known to not change the content.
    content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
    if rev_flags & content_changing:
        return len(self.revision(rev))
    # fast path: if no "read" flag processor could change the content,
    # size is rawsize.
    return self.rawsize(rev)

1913

1914

def fast_rank(self, rev):
    """Return the rank of a revision if already known, or None otherwise.

    The rank of a revision is the size of the sub-graph it defines as a
    head. Equivalently, the rank of a revision `r` is the size of the set
    `ancestors(r)`, `r` included.

    This method returns the rank retrieved from the revlog in constant
    time. It makes no attempt at computing unknown values for versions of
    the revlog which do not persist the rank.
    """
    rank = self.index[rev][ENTRY_RANK]
    rank_is_persisted = self._format_version == CHANGELOGV2
    if not rank_is_persisted or rank == RANK_UNKNOWN:
        return None
    # the null revision has rank 0 by convention
    return 0 if rev == nullrev else rank

1931

1932

def chainbase(self, rev):
    """Return the revision at the bottom of the base chain of `rev`.

    The base recorded in the index (field 3) is followed until a revision
    that is its own base is reached.  The result is remembered in
    `self._chainbasecache`.
    """
    cached = self._chainbasecache.get(rev)
    if cached is not None:
        return cached

    index = self.index
    current = rev
    while True:
        base = index[current][3]
        if base == current:
            break
        current = base

    self._chainbasecache[rev] = base
    return base

1946

1947

def linkrev(self, rev):
    """Return the link revision recorded for `rev` (index field 4)."""
    entry = self.index[rev]
    return entry[4]

1949

1950

def parentrevs(self, rev):
    """Return the two parent revisions of `rev` as a `(p1, p2)` pair.

    With canonical parent order enabled, a null first parent is swapped
    with the second one.  Raises `error.WdirUnsupported` when `rev` is the
    working directory revision and is not in the index.
    """
    try:
        entry = self.index[rev]
    except IndexError:
        if rev != wdirrev:
            raise
        raise error.WdirUnsupported

    canonical = self.feature_config.canonical_parent_order
    if canonical and entry[5] == nullrev:
        return entry[6], entry[5]
    return entry[5], entry[6]

# fast parentrevs(rev) where rev isn't filtered
_uncheckedparentrevs = parentrevs

1965

1966

def node(self, rev):
    """Return the node id stored for ``rev`` (field 7 of its index entry).

    Raises ``error.WdirUnsupported`` when ``rev`` is ``wdirrev`` and the
    index has no such entry; any other ``IndexError`` is re-raised.
    """
    try:
        return self.index[rev][7]
    except IndexError:
        if rev == wdirrev:
            raise error.WdirUnsupported
        raise

1973

1974

# Derived from index values.

1975

1976

def end(self, rev):
    """Return ``self.start(rev) + self.length(rev)`` for ``rev``."""
    return self.start(rev) + self.length(rev)

1978

1979

def parents(self, node):
    """Return the two parent node ids of ``node`` as a tuple.

    Node-based counterpart of ``parentrevs``: the parent revisions are
    read from fields 5 and 6 of the index entry and mapped back to node
    ids through field 7.  When ``feature_config.canonical_parent_order``
    is set and the first parent is null, the pair is swapped so that the
    null parent comes second.
    """
    i = self.index
    d = i[self.rev(node)]
    # inline node() to avoid function call overhead
    #
    # d[5] is a revision number, so it must be compared with nullrev.
    # Comparing it with the node id self.nullid could never match, which
    # silently disabled the canonical ordering here.
    if self.feature_config.canonical_parent_order and d[5] == nullrev:
        return i[d[6]][7], i[d[5]][7]
    else:
        return i[d[5]][7], i[d[6]][7]

1987

1988

def chainlen(self, rev):
    """Return the delta chain length of ``rev``.

    This is the first element of ``self._chaininfo(rev)``.
    """
    return self._chaininfo(rev)[0]

1990

1991

def _chaininfo(self, rev):
    """Return ``(chain length, compressed delta length)`` for ``rev``.

    The chain is walked from ``rev`` towards its base, counting one step
    per delta and summing field 1 of every index entry visited.  With
    general delta the next revision is the entry's base (field 3);
    otherwise it is simply the previous revision.  Results are memoized
    in ``self._chaininfocache``, and a cached intermediate revision
    short-circuits the walk.
    """
    chaininfocache = self._chaininfocache
    if rev in chaininfocache:
        return chaininfocache[rev]
    index = self.index
    generaldelta = self.delta_config.general_delta
    iterrev = rev
    e = index[iterrev]
    clen = 0
    compresseddeltalen = 0
    while iterrev != e[3]:
        clen += 1
        compresseddeltalen += e[1]
        if generaldelta:
            iterrev = e[3]
        else:
            iterrev -= 1
        if iterrev in chaininfocache:
            t = chaininfocache[iterrev]
            clen += t[0]
            compresseddeltalen += t[1]
            break
        e = index[iterrev]
    else:
        # Add text length of base since decompressing that also takes
        # work. For cache hits the length is already included.
        compresseddeltalen += e[1]
    r = (clen, compresseddeltalen)
    chaininfocache[rev] = r
    return r

2021

2022

def _deltachain(self, rev, stoprev=None):
    """Delegate to ``self._inner._deltachain`` with the same arguments."""
    return self._inner._deltachain(rev, stoprev=stoprev)

2024

2025

def ancestors(self, revs, stoprev=0, inclusive=False):
    """Generate the ancestors of 'revs' in reverse revision order.

    Does not generate revs lower than stoprev.

    The Rust ``LazyAncestors`` implementation is used when the
    ``rustancestor`` module is available and the index reports
    ``rust_ext_compat``; otherwise ``ancestor.lazyancestors`` is used
    with the unchecked parent lookup.

    See the documentation for ancestor.lazyancestors for more details."""

    # first, make sure start revisions aren't filtered
    revs = list(revs)
    checkrev = self.node
    for r in revs:
        checkrev(r)
    # and we're sure ancestors aren't filtered as well

    if rustancestor is not None and self.index.rust_ext_compat:
        lazyancestors = rustancestor.LazyAncestors
        arg = self.index
    else:
        lazyancestors = ancestor.lazyancestors
        arg = self._uncheckedparentrevs
    return lazyancestors(arg, revs, stoprev=stoprev, inclusive=inclusive)

2045

2046

def descendants(self, revs):
    """Return the descendants of ``revs`` as computed by
    ``dagop.descendantrevs`` over this revlog's revisions and parents."""
    return dagop.descendantrevs(revs, self.revs, self.parentrevs)

2048

2049

def findcommonmissing(self, common=None, heads=None):
    """Return a tuple of the ancestors of common and the ancestors of heads
    that are not ancestors of common. In revset terminology, we return the
    tuple:

      ::common, (::heads) - (::common)

    The first element is a lazy set-like object of revision numbers
    (supporting ``in``, iteration, ``add`` and ``update``); the second
    is a list of node IDs.

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullid."""
    if common is None:
        common = [self.nullid]
    if heads is None:
        heads = self.heads()

    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    # we want the ancestors, but inclusive
    class lazyset:
        """Union of an eagerly built set and a lazily evaluated one."""

        def __init__(self, lazyvalues):
            self.addedvalues = set()
            self.lazyvalues = lazyvalues

        def __contains__(self, value):
            return value in self.addedvalues or value in self.lazyvalues

        def __iter__(self):
            added = self.addedvalues
            for r in added:
                yield r
            for r in self.lazyvalues:
                if r not in added:
                    yield r

        def add(self, value):
            self.addedvalues.add(value)

        def update(self, values):
            self.addedvalues.update(values)

    has = lazyset(self.ancestors(common))
    has.add(nullrev)
    has.update(common)

    # take all ancestors from heads that aren't in has
    missing = set()
    visit = collections.deque(r for r in heads if r not in has)
    while visit:
        r = visit.popleft()
        if r in missing:
            continue
        else:
            missing.add(r)
            for p in self.parentrevs(r):
                if p not in has:
                    visit.append(p)
    missing = list(missing)
    missing.sort()
    return has, [self.node(miss) for miss in missing]

2112

2113

def incrementalmissingrevs(self, common=None):
    """Return an object that can be used to incrementally compute the
    revision numbers of the ancestors of arbitrary sets that are not
    ancestors of common. This is an ancestor.incrementalmissingancestors
    object (or the Rust ``MissingAncestors`` object when the
    ``rustancestor`` module is available and the index reports
    ``rust_ext_compat``).

    'common' is a list of revision numbers. If common is not supplied, uses
    nullrev.
    """
    if common is None:
        common = [nullrev]

    if rustancestor is not None and self.index.rust_ext_compat:
        return rustancestor.MissingAncestors(self.index, common)
    return ancestor.incrementalmissingancestors(self.parentrevs, common)

2128

2129

def findmissingrevs(self, common=None, heads=None):
    """Return the revision numbers of the ancestors of heads that
    are not ancestors of common.

    More specifically, return a list of revision numbers corresponding to
    nodes N such that every N satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of revision numbers.  If heads is
    not supplied, uses all of the revlog's head revisions.  If common is
    not supplied, uses nullrev."""
    if common is None:
        common = [nullrev]
    if heads is None:
        heads = self.headrevs()

    inc = self.incrementalmissingrevs(common=common)
    return inc.missingancestors(heads)

2152

2153

def findmissing(self, common=None, heads=None):
    """Return the ancestors of heads that are not ancestors of common.

    More specifically, return a list of nodes N such that every N
    satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullid."""
    if common is None:
        common = [self.nullid]
    if heads is None:
        heads = self.heads()

    # The incremental helper works on revision numbers, so convert the
    # node IDs on the way in and back on the way out.
    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    inc = self.incrementalmissingrevs(common=common)
    return [self.node(r) for r in inc.missingancestors(heads)]

2178

2179

def nodesbetween(self, roots=None, heads=None):
    """Return a topological path from 'roots' to 'heads'.

    Return a tuple (nodes, outroots, outheads) where 'nodes' is a
    topologically sorted list of all nodes N that satisfy both of
    these constraints:

      1. N is a descendant of some node in 'roots'
      2. N is an ancestor of some node in 'heads'

    Every node is considered to be both a descendant and an ancestor
    of itself, so every reachable node in 'roots' and 'heads' will be
    included in 'nodes'.

    'outroots' is the list of reachable nodes in 'roots', i.e., the
    subset of 'roots' that is returned in 'nodes'.  Likewise,
    'outheads' is the subset of 'heads' that is also in 'nodes'.

    'roots' and 'heads' are both lists of node IDs.  If 'roots' is
    unspecified, uses nullid as the only root.  If 'heads' is
    unspecified, uses list of all of the revlog's heads.

    When nothing qualifies, three empty lists are returned."""
    nonodes = ([], [], [])
    if roots is not None:
        roots = list(roots)
        if not roots:
            return nonodes
        lowestrev = min([self.rev(n) for n in roots])
    else:
        roots = [self.nullid]  # Everybody's a descendant of nullid
        lowestrev = nullrev
    if (lowestrev == nullrev) and (heads is None):
        # We want _all_ the nodes!
        return (
            [self.node(r) for r in self],
            [self.nullid],
            list(self.heads()),
        )
    if heads is None:
        # All nodes are ancestors, so the latest ancestor is the last
        # node.
        highestrev = len(self) - 1
        # Set ancestors to None to signal that every node is an ancestor.
        ancestors = None
        # Set heads to an empty dictionary for later discovery of heads
        heads = {}
    else:
        heads = list(heads)
        if not heads:
            return nonodes
        ancestors = set()
        # Turn heads into a dictionary so we can remove 'fake' heads.
        # Also, later we will be using it to filter out the heads we can't
        # find from roots.
        heads = dict.fromkeys(heads, False)
        # Start at the top and keep marking parents until we're done.
        nodestotag = set(heads)
        # Remember where the top was so we can use it as a limit later.
        highestrev = max([self.rev(n) for n in nodestotag])
        while nodestotag:
            # grab a node to tag
            n = nodestotag.pop()
            # Never tag nullid
            if n == self.nullid:
                continue
            # A node's revision number represents its place in a
            # topologically sorted list of nodes.
            r = self.rev(n)
            if r >= lowestrev:
                if n not in ancestors:
                    # If we are possibly a descendant of one of the roots
                    # and we haven't already been marked as an ancestor
                    ancestors.add(n)  # Mark as ancestor
                    # Add non-nullid parents to list of nodes to tag.
                    nodestotag.update(
                        [p for p in self.parents(n) if p != self.nullid]
                    )
                elif n in heads:  # We've seen it before, is it a fake head?
                    # So it is, real heads should not be the ancestors of
                    # any other heads.
                    heads.pop(n)
        if not ancestors:
            return nonodes
        # Now that we have our set of ancestors, we want to remove any
        # roots that are not ancestors.

        # If one of the roots was nullid, everything is included anyway.
        if lowestrev > nullrev:
            # But, since we weren't, let's recompute the lowest rev to not
            # include roots that aren't ancestors.

            # Filter out roots that aren't ancestors of heads
            roots = [root for root in roots if root in ancestors]
            # Recompute the lowest revision
            if roots:
                lowestrev = min([self.rev(root) for root in roots])
            else:
                # No more roots?  Return empty list
                return nonodes
        else:
            # We are descending from nullid, and don't need to care about
            # any other roots.
            lowestrev = nullrev
            roots = [self.nullid]
    # Transform our roots list into a set.
    descendants = set(roots)
    # Also, keep the original roots so we can filter out roots that aren't
    # 'real' roots (i.e. are descended from other roots).
    roots = descendants.copy()
    # Our topologically sorted list of output nodes.
    orderedout = []
    # Don't start at nullid since we don't want nullid in our output list,
    # and if nullid shows up in descendants, empty parents will look like
    # they're descendants.
    for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
        n = self.node(r)
        isdescendant = False
        if lowestrev == nullrev:  # Everybody is a descendant of nullid
            isdescendant = True
        elif n in descendants:
            # n is already a descendant
            isdescendant = True
            # This check only needs to be done here because all the roots
            # will start being marked as descendants before the loop.
            if n in roots:
                # If n was a root, check if it's a 'real' root.
                p = tuple(self.parents(n))
                # If any of its parents are descendants, it's not a root.
                if (p[0] in descendants) or (p[1] in descendants):
                    roots.remove(n)
        else:
            p = tuple(self.parents(n))
            # A node is a descendant if either of its parents are
            # descendants.  (We seeded the descendants set with the roots
            # up there, remember?)
            if (p[0] in descendants) or (p[1] in descendants):
                descendants.add(n)
                isdescendant = True
        if isdescendant and ((ancestors is None) or (n in ancestors)):
            # Only include nodes that are both descendants and ancestors.
            orderedout.append(n)
            if (ancestors is not None) and (n in heads):
                # We're trying to figure out which heads are reachable
                # from roots.
                # Mark this head as having been reached
                heads[n] = True
            elif ancestors is None:
                # Otherwise, we're trying to discover the heads.
                # Assume this is a head because if it isn't, the next step
                # will eventually remove it.
                heads[n] = True
                # But, obviously its parents aren't.
                for p in self.parents(n):
                    heads.pop(p, None)
    heads = [head for head, flag in heads.items() if flag]
    roots = list(roots)
    # Internal invariants: every early-exit case returned nonodes above.
    assert orderedout
    assert roots
    assert heads
    return (orderedout, roots, heads)

2338

2339

def headrevs(self, revs=None):
    """Return the head revision numbers.

    With ``revs`` left as None the heads of the whole revlog are
    returned: the index's own ``headrevs()`` is used when it has one,
    otherwise the pure-Python ``self._headrevs()`` fallback.  When
    ``revs`` is given, the heads are computed within that subset.
    """
    if revs is None:
        try:
            return self.index.headrevs()
        except AttributeError:
            # the index implementation does not provide headrevs()
            return self._headrevs()
    if rustdagop is not None and self.index.rust_ext_compat:
        return rustdagop.headrevs(self.index, revs)
    return dagop.headrevs(revs, self._uncheckedparentrevs)

2348

2349

def computephases(self, roots):
    """Delegate to ``self.index.computephasesmapsets(roots)``."""
    return self.index.computephasesmapsets(roots)

2351

2352

def _headrevs(self):
    """Pure-Python computation of the head revision numbers.

    Returns ``[nullrev]`` for an empty revlog.  Otherwise every revision
    yielded by iterating ``self`` is first assumed to be a head, and
    both of its parents (fields 5 and 6 of its index entry) are then
    marked as non-heads.
    """
    count = len(self)
    if not count:
        return [nullrev]
    # we won't iter over filtered rev so nobody is a head at start
    #
    # One extra slot is allocated so that a parent equal to -1 indexes
    # the last element rather than clobbering a real revision's flag.
    ishead = [0] * (count + 1)
    index = self.index
    for r in self:
        ishead[r] = 1  # I may be a head
        e = index[r]
        ishead[e[5]] = ishead[e[6]] = 0  # my parents are not
    return [r for r, val in enumerate(ishead) if val]

2364

2365

def heads(self, start=None, stop=None):
    """return the list of all nodes that have no children

    if start is specified, only heads that are descendants of
    start will be returned
    if stop is specified, it will consider all the revs from stop
    as if they had no children

    'start' is a node ID and 'stop' is an iterable of node IDs.  For an
    empty revlog with neither argument given, ``[nullid]`` is returned.
    """
    if start is None and stop is None:
        if not len(self):
            return [self.nullid]
        return [self.node(r) for r in self.headrevs()]

    if start is None:
        start = nullrev
    else:
        start = self.rev(start)

    stoprevs = {self.rev(n) for n in stop or []}

    revs = dagop.headrevssubset(
        self.revs, self.parentrevs, startrev=start, stoprevs=stoprevs
    )

    return [self.node(rev) for rev in revs]

2390

2391

def children(self, node):
    """find the children of a given node

    Every revision after ``node`` is scanned and returned (as a node ID)
    when one of its non-null parents is ``node``.  When ``node`` is the
    null node, the revisions that have no non-null parent are returned
    instead.
    """
    c = []
    p = self.rev(node)
    for r in self.revs(start=p + 1):
        prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
        if prevs:
            for pr in prevs:
                if pr == p:
                    c.append(self.node(r))
        elif p == nullrev:
            # r has no real parent, so it is a child of the null revision
            c.append(self.node(r))
    return c

2404

2405

def commonancestorsheads(self, a, b):
    """calculate all the heads of the common ancestors of nodes a and b

    Both arguments are node IDs; the result is a list of node IDs.
    """
    a, b = self.rev(a), self.rev(b)
    ancs = self._commonancestorsheads(a, b)
    return pycompat.maplist(self.node, ancs)

2410

2411

def _commonancestorsheads(self, *revs):
    """calculate all the heads of the common ancestors of revs

    The index's own ``commonancestorsheads`` is tried first.  When it is
    missing (AttributeError) or raises OverflowError, the pure-Python
    ``ancestor.commonancestorsheads`` is used instead.
    """
    try:
        ancs = self.index.commonancestorsheads(*revs)
    except (AttributeError, OverflowError):  # C implementation failed
        ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
    return ancs

2418

2419

def isancestor(self, a, b):
    """Tell whether node ``a`` is an ancestor of node ``b``.

    A revision is considered an ancestor of itself.
    """
    rev_a = self.rev(a)
    rev_b = self.rev(b)
    return self.isancestorrev(rev_a, rev_b)

2425

2426

def isancestorrev(self, a, b):
    """Tell whether revision ``a`` is an ancestor of revision ``b``.

    A revision is considered an ancestor of itself.

    The implementation of this is trivial but the use of
    reachableroots is not.
    """
    # the null revision and the revision itself are always ancestors
    if a == nullrev or a == b:
        return True
    # a higher revision number is never reported as an ancestor
    if a > b:
        return False
    return bool(self.reachableroots(a, [b], [a], includepath=False))

2440

2441

def reachableroots(self, minroot, heads, roots, includepath=False):
    """return (heads(::(<roots> and <roots>::<heads>)))

    If includepath is True, return (<roots>::<heads>).

    ``self.index.reachableroots2`` is used when available; on
    AttributeError the pure implementation from ``dagop`` is used.
    """
    try:
        found = self.index.reachableroots2(
            minroot, heads, roots, includepath
        )
    except AttributeError:
        # note the swapped roots/heads order expected by the pure helper
        found = dagop._reachablerootspure(
            self.parentrevs, minroot, roots, heads, includepath
        )
    return found

2453

2454

def ancestor(self, a, b):
    """Return the "best" common ancestor node of nodes a and b.

    When several candidates exist, the smallest node is returned so the
    result is consistent.  ``self.nullid`` is returned when there is no
    candidate.
    """
    rev_a, rev_b = self.rev(a), self.rev(b)
    try:
        candidates = self.index.ancestors(rev_a, rev_b)
    except (AttributeError, OverflowError):
        candidates = ancestor.ancestors(self.parentrevs, rev_a, rev_b)
    if not candidates:
        return self.nullid
    # choose a consistent winner when there's a tie
    return min(self.node(rev) for rev in candidates)

2466

2467

def _match(self, id):
    """Resolve ``id`` to a node when it is an exact identifier.

    Tried in order: an integer revision, a binary node, the decimal text
    of a revision number (negative values count from the end), and a
    full hex node id.  Returns None when none of these match.
    """
    if isinstance(id, int):
        # rev
        return self.node(id)

    if len(id) == self.nodeconstants.nodelen:
        # possibly a binary node
        # odds of a binary node being all hex in ASCII are 1 in 10**25
        try:
            self.rev(id)  # quick search the index
        except error.LookupError:
            pass  # may be partial hex id
        else:
            return id

    try:
        # str(rev)
        rev = int(id)
        if b"%d" % rev != id:
            # reject non canonical spellings such as b"02" or b"+2"
            raise ValueError
        if rev < 0:
            rev += len(self)
        if not 0 <= rev < len(self):
            raise ValueError
        return self.node(rev)
    except (ValueError, OverflowError):
        pass

    if len(id) == 2 * self.nodeconstants.nodelen:
        try:
            # a full hex nodeid?
            candidate = bin(id)
            self.rev(candidate)
        except (binascii.Error, error.LookupError):
            pass
        else:
            return candidate
    return None

2500

2501

def _partialmatch(self, id):
    """Resolve a hex prefix ``id`` to a node.

    Returns the matching node, or None when nothing matches.  Raises
    ``error.AmbiguousPrefixLookupError`` when the prefix is ambiguous and
    ``error.WdirUnsupported`` when it only matches the working directory
    pseudo-id.
    """
    # we don't care wdirfilenodeids as they should be always full hash
    maybewdir = self.nodeconstants.wdirhex.startswith(id)
    ambiguous = False
    try:
        partial = self.index.partialmatch(id)
        if not (partial and self.hasnode(partial)):
            if maybewdir:
                # no 'ff...' match in radix tree, wdir identified
                raise error.WdirUnsupported
            return None
        if not maybewdir:
            return partial
        # single 'ff...' match in radix tree, ambiguous with wdir
        ambiguous = True
    except error.RevlogError:
        # parsers.c radix tree lookup gave multiple matches
        # fast path: for unfiltered changelog, radix tree is accurate
        if not getattr(self, 'filteredrevs', None):
            ambiguous = True
        # fall through to slow path that filters hidden revisions
    except (AttributeError, ValueError):
        # we are pure python, or key is not hex
        pass

    if ambiguous:
        raise error.AmbiguousPrefixLookupError(
            id, self.display_id, _(b'ambiguous identifier')
        )

    if id in self._pcache:
        return self._pcache[id]

    if len(id) > 40:
        return None

    # hex(node)[:...]
    even_len = len(id) // 2 * 2  # grab an even number of digits
    try:
        # we're dropping the last digit, so let's check that it's hex,
        # to avoid the expensive computation below if it's not
        if len(id) % 2 > 0 and id[-1] not in hexdigits:
            return None
        prefix = bin(id[:even_len])
    except binascii.Error:
        return None

    candidates = [e[7] for e in self.index if e[7].startswith(prefix)]
    matches = [
        n for n in candidates if hex(n).startswith(id) and self.hasnode(n)
    ]
    if self.nodeconstants.nullhex.startswith(id):
        matches.append(self.nullid)
    if matches:
        if len(matches) == 1 and not maybewdir:
            self._pcache[id] = matches[0]
            return matches[0]
        raise error.AmbiguousPrefixLookupError(
            id, self.display_id, _(b'ambiguous identifier')
        )
    if maybewdir:
        raise error.WdirUnsupported
    return None

2564

2565

def lookup(self, id):
    """Locate a node from an identifier.

    The identifier may be:
    - a revision number or str(revision number)
    - a nodeid or a subset of a hex nodeid

    Raises ``error.LookupError`` when nothing matches.
    """
    exact = self._match(id)
    if exact is not None:
        return exact
    partial = self._partialmatch(id)
    if partial:
        return partial

    raise error.LookupError(id, self.display_id, _(b'no match found'))

2578

2579

def shortest(self, node, minlength=1):
    """Find the shortest unambiguous prefix that matches node.

    The returned hex prefix is at least ``minlength`` characters long.
    """

    def isvalid(candidate):
        # True when ``candidate`` resolves unambiguously
        try:
            resolved = self._partialmatch(candidate)
        except error.AmbiguousPrefixLookupError:
            return False
        except error.WdirUnsupported:
            # single 'ff...' match
            return True
        if resolved is None:
            raise error.LookupError(node, self.display_id, _(b'no node'))
        return True

    def maybewdir(candidate):
        # a prefix made only of 'f' could designate the working directory
        return all(ch == b'f' for ch in pycompat.iterbytestr(candidate))

    hexnode = hex(node)

    def disambiguate(hexnode, minlength):
        """Disambiguate against wdirid."""
        for size in range(minlength, len(hexnode) + 1):
            candidate = hexnode[:size]
            if not maybewdir(candidate):
                return candidate

    if not getattr(self, 'filteredrevs', None):
        try:
            size = max(self.index.shortest(node), minlength)
            return disambiguate(hexnode, size)
        except error.RevlogError:
            if node != self.nodeconstants.wdirid:
                raise error.LookupError(
                    node, self.display_id, _(b'no node')
                )
        except AttributeError:
            # Fall through to pure code
            pass

    if node == self.nodeconstants.wdirid:
        for size in range(minlength, len(hexnode) + 1):
            candidate = hexnode[:size]
            if isvalid(candidate):
                return candidate

    for size in range(minlength, len(hexnode) + 1):
        candidate = hexnode[:size]
        if isvalid(candidate):
            return disambiguate(hexnode, size)

2629

2630

def cmp(self, node, text):
    """Compare ``text`` with a given file revision.

    Returns True if the text is different than what is stored, judged by
    hashing ``text`` with the parents of ``node`` and comparing to ``node``.
    """
    p1, p2 = self.parents(node)
    computed = storageutil.hashrevisionsha1(text, p1, p2)
    return computed != node

2637

2638

def deltaparent(self, rev):
    """Return the delta parent of the given revision.

    A revision whose recorded base is itself has ``nullrev`` as delta
    parent.  Otherwise the recorded base is returned when general delta
    is enabled, and the previous revision when it is not.
    """
    base = self.index[rev][3]
    if base == rev:
        return nullrev
    if self.delta_config.general_delta:
        return base
    return rev - 1

2647

2648

def issnapshot(self, rev):
    """Tell whether ``rev`` is a snapshot.

    After the first successful call, the instance attribute
    ``issnapshot`` is rebound to the inner object's method, so later
    calls bypass this wrapper.
    """
    inner_check = self._inner.issnapshot
    answer = inner_check(rev)
    self.issnapshot = inner_check
    return answer

2653

2654

def snapshotdepth(self, rev):
    """Return the number of snapshots in the chain before this one.

    The result is the length of the delta chain of ``rev`` minus one.

    Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
    """
    if not self.issnapshot(rev):
        # interpolate the revision number; the message used to be raised
        # with a literal, unformatted ``%d``
        raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
    return len(self._inner._deltachain(rev)[0]) - 1

2659

2660

def revdiff(self, rev1, rev2):
    """Return or calculate a delta between two revisions.

    The delta calculated is in binary form and is intended to be written
    to revlog data directly. So this function needs raw revision data.
    """
    # when rev2 is stored as a delta against rev1, reuse the stored chunk
    stored_delta = rev1 != nullrev and self.deltaparent(rev2) == rev1
    if stored_delta:
        return bytes(self._inner._chunk(rev2))

    old_raw = self.rawdata(rev1)
    new_raw = self.rawdata(rev2)
    return mdiff.textdiff(old_raw, new_raw)

2670

2671

def revision(self, nodeorrev):
    """Return the uncompressed revision text for a node or revision number.

    Delegates to ``_revisiondata`` with its default (non raw) mode.
    """
    text = self._revisiondata(nodeorrev)
    return text

2676

2677

def sidedata(self, nodeorrev):
    """Return a map of extra data related to the changeset but not part
    of the hash.

    This function currently returns a dictionary. However, a more
    advanced mapping object will likely be used in the future for more
    efficient/lazy code.
    """
    # accept either a revision number or a node
    rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
    return self._sidedata(rev)

2690

2691

def _rawtext(self, node, rev):
    """Return the possibly unvalidated rawtext for a revision.

    returns (rev, rawtext, validated)

    On a revision-cache hit the ``rev`` argument is returned unchanged,
    so it may still be None.
    """
    # The cache entry looks like (node, rev, rawtext)
    cached = self._inner._revisioncache
    if cached and cached[0] == node:
        return (rev, cached[2], True)

    if rev is None:
        rev = self.rev(node)

    return self._inner.raw_text(node, rev)

2706

2707

def _revisiondata(self, nodeorrev, raw=False):
    """Return the text of a revision given as a node or revision number.

    With ``raw=True`` the text as stored in the revlog is returned;
    otherwise the read flag processors are applied.  The hash is checked
    when the flag processing requests it.
    """
    # deal with <nodeorrev> argument type
    if isinstance(nodeorrev, int):
        node, rev = self.node(nodeorrev), nodeorrev
    else:
        node, rev = nodeorrev, None

    # fast path the special `nullid` rev
    if node == self.nullid:
        return b""

    # ``rawtext`` is the text as stored inside the revlog. Might be the
    # revision or might need to be processed to retrieve the revision.
    rev, rawtext, validated = self._rawtext(node, rev)

    if raw and validated:
        # if we don't want to process the raw text and that raw
        # text is cached, we can exit early.
        return rawtext
    if rev is None:
        rev = self.rev(node)
    # the revlog's flag for this revision
    # (usually alter its state or content)
    flags = self.flags(rev)

    if validated and flags == REVIDX_DEFAULT_FLAGS:
        # no extra flags set, no flag processor runs, text = rawtext
        return rawtext

    if raw:
        validatehash = flagutil.processflagsraw(self, rawtext, flags)
        text = rawtext
    else:
        text, validatehash = flagutil.processflagsread(self, rawtext, flags)
    if validatehash:
        self.checkhash(text, node, rev=rev)
    if not validated:
        # remember the raw text now that it went through processing
        self._inner._revisioncache = (node, rev, rawtext)

    return text

2750

2751

def _sidedata(self, rev):
    """Return the sidedata for a given revision number.

    The docket's ``sidedata_end`` is forwarded to the inner object when a
    docket is present, None otherwise.
    """
    docket = self._docket
    sidedata_end = None if docket is None else docket.sidedata_end
    return self._inner.sidedata(rev, sidedata_end)

2757

2758

def rawdata(self, nodeorrev):
    """Return the uncompressed raw data of a given node or revision number.

    Delegates to ``_revisiondata`` in raw mode.
    """
    raw_text = self._revisiondata(nodeorrev, raw=True)
    return raw_text

2761

2762

def hash(self, text, p1, p2):
    """Compute a node hash from a text and its two parents.

    Available as a function so that subclasses can replace the hash
    as needed.
    """
    digest = storageutil.hashrevisionsha1(text, p1, p2)
    return digest

2769

2770

def checkhash(self, text, node, p1=None, p2=None, rev=None):
    """Check node hash integrity.

    Available as a function so that subclasses can extend hash mismatch
    behaviors as needed.

    The parents are looked up from ``node`` when both are omitted.
    Raises ``error.RevlogError`` on mismatch, or
    ``error.CensoredNodeError`` when the revlog is censorable and the
    text is censored.
    """
    try:
        if p1 is None and p2 is None:
            p1, p2 = self.parents(node)
        if node == self.hash(text, p1, p2):
            return

        # Clear the revision cache on hash failure. The revision cache
        # only stores the raw revision and clearing the cache does have
        # the side-effect that we won't have a cache hit when the raw
        # revision data is accessed. But this case should be rare and
        # it is extra work to teach the cache about the hash
        # verification state.
        cached = self._inner._revisioncache
        if cached and cached[0] == node:
            self._inner._revisioncache = None

        # prefer the revision number in the message, else a short hash
        revornode = rev
        if revornode is None:
            revornode = templatefilters.short(hex(node))
        raise error.RevlogError(
            _(b"integrity check failed on %s:%s")
            % (self.display_id, pycompat.bytestr(revornode))
        )
    except error.RevlogError:
        censored = self.feature_config.censorable and (
            storageutil.iscensoredtext(text)
        )
        if censored:
            raise error.CensoredNodeError(self.display_id, node, text)
        raise

2805

2806

@property
def _split_index_file(self):
    """The path where to expect the index of an ongoing splitting operation.

    The file will only exist if a splitting operation is in progress, but
    it is always expected at the same location.
    """
    first, *rest = self.radix.split(b'/')
    if not rest:
        # the revlog is stored at the root of the store (changelog or
        # manifest), no risk of collision.
        return self.radix + b'.i.s'
    # append '-s' to the leading directory (the `data/` or `meta/` base)
    *middle, last = rest
    return b'/'.join([first + b'-s', *middle, last + b'.i'])

2824

2825

def _enforceinlinesize(self, tr, side_write=True):
    """Check if the revlog is too big for inline and convert if so.

    This should be called after revisions are added to the revlog. If the
    revlog has grown too large to be an inline revlog, it will convert it
    to use multiple index and data files.

    With ``side_write`` the new index is written to the split index path
    and renamed over the real index when the transaction is finalized.
    """
    tiprev = len(self) - 1
    total_size = self.start(tiprev) + self.length(tiprev)
    if not self._inline or (self._may_inline and total_size < _maxinline):
        return

    if self._docket is not None:
        msg = b"inline revlog should not have a docket"
        raise error.ProgrammingError(msg)

    # In the common case, we enforce inline size because the revlog has
    # been appended to. And in such case, it must have an initial offset
    # recorded in the transaction.
    canonical_index = self._inner.canonical_index_file
    pre_touched = tr.findoffset(canonical_index) is not None
    if not pre_touched and self.target[0] != KIND_CHANGELOG:
        raise error.RevlogError(
            _(b"%s not found in the transaction") % self._indexfile
        )

    tr.addbackup(canonical_index, for_offset=pre_touched)
    tr.add(self._datafile, 0)

    new_index_file_path = None
    if side_write:
        old_index_file_path = self._indexfile
        new_index_file_path = self._split_index_file
        opener = self.opener
        # the callbacks must not keep this revlog alive
        weak_self = weakref.ref(self)

        # the "split" index replace the real index when the transaction is
        # finalized
        def finalize_callback(tr):
            opener.rename(
                new_index_file_path,
                old_index_file_path,
                checkambig=True,
            )
            revlog = weak_self()
            if revlog is not None:
                revlog._indexfile = old_index_file_path
                revlog._inner.index_file = revlog._indexfile

        def abort_callback(tr):
            # restore the inline state recorded before the split
            revlog = weak_self()
            if revlog is not None:
                revlog._indexfile = old_index_file_path
                revlog._inner.inline = True
                revlog._inner.index_file = old_index_file_path

        tr.registertmp(new_index_file_path)
        if self.target[1] is not None:
            callback_id = b'000-revlog-split-%d-%s' % self.target
        else:
            callback_id = b'000-revlog-split-%d' % self.target[0]
        tr.addfinalize(callback_id, finalize_callback)
        tr.addabort(callback_id, abort_callback)

    self._format_flags &= ~FLAG_INLINE_DATA
    self._inner.split_inline(
        tr,
        self._format_flags | self._format_version,
        new_index_file_path=new_index_file_path,
    )

    self._inline = False
    if new_index_file_path is not None:
        self._indexfile = new_index_file_path

    nodemaputil.setup_persistent_nodemap(tr, self)

2901

2902

def _nodeduplicatecallback(self, transaction, node):

2902

def _nodeduplicatecallback(self, transaction, node):

2903

"""called when trying to add a node already stored."""

2903

"""called when trying to add a node already stored."""

2904

2905

@contextlib.contextmanager
def reading(self):
    """Context manager that wraps ``self._inner.reading()``.

    The caller's ``with`` body runs while the inner object's reading
    context is active.
    """
    with self._inner.reading():
        yield

2909

2910

@contextlib.contextmanager

2910

@contextlib.contextmanager

2911

def _writing(self, transaction):

2911

def _writing(self, transaction):

2912

if self._trypending:

2912

if self._trypending:

2913

msg = b'try to write in a `trypending` revlog: %s'

2913

msg = b'try to write in a `trypending` revlog: %s'

2914

msg %= self.display_id

2914

msg %= self.display_id

2915

raise error.ProgrammingError(msg)

2915

raise error.ProgrammingError(msg)

2916

if self._inner.is_writing:

2916

if self._inner.is_writing:

2917

yield

2917

yield

2918

else:

2918

else:

2919

data_end = None

2919

data_end = None

2920

sidedata_end = None

2920

sidedata_end = None

2921

if self._docket is not None:

2921

if self._docket is not None:

2922

data_end = self._docket.data_end

2922

data_end = self._docket.data_end

2923

sidedata_end = self._docket.sidedata_end

2923

sidedata_end = self._docket.sidedata_end

2924

with self._inner.writing(

2924

with self._inner.writing(

2925

transaction,

2925

transaction,

2926

data_end=data_end,

2926

data_end=data_end,

2927

sidedata_end=sidedata_end,

2927

sidedata_end=sidedata_end,

2928

):

2928

):

2929

yield

2929

yield

2930

if self._docket is not None:

2930

if self._docket is not None:

2931

self._write_docket(transaction)

2931

self._write_docket(transaction)

2932

2933

@property
def is_delaying(self):
    """Expose ``self._inner.is_delaying`` as a read-only property."""
    return self._inner.is_delaying

2936

2937

def _write_docket(self, transaction):

2937

def _write_docket(self, transaction):

2938

"""write the current docket on disk

2938

"""write the current docket on disk

2939

2940

Exist as a method to help changelog to implement transaction logic

2940

Exist as a method to help changelog to implement transaction logic

2941

2942

We could also imagine using the same transaction logic for all revlog

2942

We could also imagine using the same transaction logic for all revlog

2943

since docket are cheap."""

2943

since docket are cheap."""

2944

self._docket.write(transaction)

2944

self._docket.write(transaction)

2945

2946

def addrevision(
    self,
    text,
    transaction,
    link,
    p1,
    p2,
    cachedelta=None,
    node=None,
    flags=REVIDX_DEFAULT_FLAGS,
    deltacomputer=None,
    sidedata=None,
):
    """add a revision to the log

    text - the revision data to add
    transaction - the transaction object used for rollback
    link - the linkrev data to add
    p1, p2 - the parent nodeids of the revision
    cachedelta - an optional precomputed delta
    node - nodeid of revision; typically node is not specified, and it is
        computed by default as hash(text, p1, p2), however subclasses might
        use different hashing method (and override checkhash() in such case)
    flags - the known flags to set on the revision
    deltacomputer - an optional deltacomputer instance shared between
        multiple calls
    sidedata - optional sidedata for the revision; ``None`` is treated as
        an empty dict, and non-empty sidedata is rejected when the revlog
        does not support it

    Returns the revision number: the existing one when the node is already
    in the index, otherwise the result of ``addrawrevision()``.

    Raises ``error.RevlogError`` when ``link`` is ``nullrev`` or the raw
    text is larger than ``_maxentrysize``, and ``error.ProgrammingError``
    when sidedata is given to a revlog without sidedata support.
    """
    if link == nullrev:
        raise error.RevlogError(
            _(b"attempted to add linkrev -1 to %s") % self.display_id
        )

    if sidedata is None:
        sidedata = {}
    elif sidedata and not self.feature_config.has_side_data:
        raise error.ProgrammingError(
            _(b"trying to add sidedata to a revlog who don't support them")
        )

    if flags:
        # with flags set, the node is derived from the non-raw text
        node = node or self.hash(text, p1, p2)

    rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

    # If the flag processor modifies the revision data, ignore any provided
    # cachedelta.
    if rawtext != text:
        cachedelta = None

    if len(rawtext) > _maxentrysize:
        raise error.RevlogError(
            _(
                b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
            )
            % (self.display_id, len(rawtext))
        )

    node = node or self.hash(rawtext, p1, p2)
    rev = self.index.get_rev(node)
    if rev is not None:
        # already stored: nothing to write
        return rev

    if validatehash:
        self.checkhash(rawtext, node, p1=p1, p2=p2)

    return self.addrawrevision(
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=cachedelta,
        deltacomputer=deltacomputer,
        sidedata=sidedata,
    )

3023

3024

def addrawrevision(
    self,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    node,
    flags,
    cachedelta=None,
    deltacomputer=None,
    sidedata=None,
):
    """add a raw revision with known flags, node and parents

    useful when reusing a revision not stored in this revlog (ex: received
    over wire, or read from an external bundle).

    The call is made inside ``self._writing(transaction)`` and returns
    whatever ``self._addrevision()`` returns.
    """
    with self._writing(transaction):
        return self._addrevision(
            node,
            rawtext,
            transaction,
            link,
            p1,
            p2,
            flags,
            cachedelta,
            deltacomputer=deltacomputer,
            sidedata=sidedata,
        )

3054

3055

def compress(self, data):
    """Return the result of ``self._inner.compress(data)``."""
    return self._inner.compress(data)

3057

3058

def decompress(self, data):
    """Return the result of ``self._inner.decompress(data)``."""
    return self._inner.decompress(data)

3060

3061

def _addrevision(
    self,
    node,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    flags,
    cachedelta,
    alwayscache=False,
    deltacomputer=None,
    sidedata=None,
):
    """internal function to add revisions to the log

    see addrevision for argument descriptions.

    note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

    if "deltacomputer" is not provided or None, a defaultdeltacomputer will
    be used.

    invariants:
    - rawtext is optional (can be None); if not set, cachedelta must be set.
      if both are set, they must correspond to each other.

    Returns the revision number given to the new entry (the length of the
    revlog before the append).

    Raises ``error.RevlogError`` for the null node or a working-directory
    node, and ``error.ProgrammingError`` when called outside of a writing
    context.
    """
    if node == self.nullid:
        raise error.RevlogError(
            _(b"%s: attempt to add null revision") % self.display_id
        )
    if (
        node == self.nodeconstants.wdirid
        or node in self.nodeconstants.wdirfilenodeids
    ):
        raise error.RevlogError(
            _(b"%s: attempt to add wdir revision") % self.display_id
        )
    if self._inner._writinghandles is None:
        msg = b'adding revision outside `revlog._writing` context'
        raise error.ProgrammingError(msg)

    # one-element list handed to revisioninfo; read back as btext[0] below
    btext = [rawtext]

    curr = len(self)
    prev = curr - 1

    offset = self._get_data_offset(prev)

    if self._concurrencychecker:
        ifh, dfh, sdfh = self._inner._writinghandles
        # XXX no checking for the sidedata file
        if self._inline:
            # offset is "as if" it were in the .d file, so we need to add on
            # the size of the entry metadata.
            self._concurrencychecker(
                ifh, self._indexfile, offset + curr * self.index.entry_size
            )
        else:
            # Entries in the .i are a consistent size.
            self._concurrencychecker(
                ifh, self._indexfile, curr * self.index.entry_size
            )
            self._concurrencychecker(dfh, self._datafile, offset)

    p1r, p2r = self.rev(p1), self.rev(p2)

    # full versions are inserted when the needed deltas
    # become comparable to the uncompressed text
    if rawtext is None:
        # need rawtext size, before changed by flag processors, which is
        # the non-raw size. use revlog explicitly to avoid filelog's extra
        # logic that might remove metadata size.
        textlen = mdiff.patchedsize(
            revlog.size(self, cachedelta[0]), cachedelta[1]
        )
    else:
        textlen = len(rawtext)

    if deltacomputer is None:
        write_debug = None
        if self.delta_config.debug_delta:
            write_debug = transaction._report
        deltacomputer = deltautil.deltacomputer(
            self, write_debug=write_debug
        )

    if cachedelta is not None and len(cachedelta) == 2:
        # If the cached delta has no information about how it should be
        # reused, add the default reuse instruction according to the
        # revlog's configuration.
        if (
            self.delta_config.general_delta
            and self.delta_config.lazy_delta_base
        ):
            delta_base_reuse = DELTA_BASE_REUSE_TRY
        else:
            delta_base_reuse = DELTA_BASE_REUSE_NO
        cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)

    revinfo = revlogutils.revisioninfo(
        node,
        p1,
        p2,
        btext,
        textlen,
        cachedelta,
        flags,
    )

    deltainfo = deltacomputer.finddeltainfo(revinfo)

    compression_mode = COMP_MODE_INLINE
    if self._docket is not None:
        default_comp = self._docket.default_compression_header
        r = deltautil.delta_compression(default_comp, deltainfo)
        compression_mode, deltainfo = r

    sidedata_compression_mode = COMP_MODE_INLINE
    if sidedata and self.feature_config.has_side_data:
        sidedata_compression_mode = COMP_MODE_PLAIN
        serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
        sidedata_offset = self._docket.sidedata_end
        h, comp_sidedata = self._inner.compress(serialized_sidedata)
        # only keep the compressed form when it is actually smaller and
        # does not start with a NUL byte
        if (
            h != b'u'
            and comp_sidedata[0:1] != b'\0'
            and len(comp_sidedata) < len(serialized_sidedata)
        ):
            assert not h
            if (
                comp_sidedata[0:1]
                == self._docket.default_compression_header
            ):
                sidedata_compression_mode = COMP_MODE_DEFAULT
                serialized_sidedata = comp_sidedata
            else:
                sidedata_compression_mode = COMP_MODE_INLINE
                serialized_sidedata = comp_sidedata
    else:
        serialized_sidedata = b""
        # Don't store the offset if the sidedata is empty, that way
        # we can easily detect empty sidedata and they will be no different
        # than ones we manually add.
        sidedata_offset = 0

    rank = RANK_UNKNOWN
    if self.feature_config.compute_rank:
        if (p1r, p2r) == (nullrev, nullrev):
            rank = 1
        elif p1r != nullrev and p2r == nullrev:
            rank = 1 + self.fast_rank(p1r)
        elif p1r == nullrev and p2r != nullrev:
            rank = 1 + self.fast_rank(p2r)
        else:  # merge node
            if rustdagop is not None and self.index.rust_ext_compat:
                rank = rustdagop.rank(self.index, p1r, p2r)
            else:
                pmin, pmax = sorted((p1r, p2r))
                rank = 1 + self.fast_rank(pmax)
                rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))

    e = revlogutils.entry(
        flags=flags,
        data_offset=offset,
        data_compressed_length=deltainfo.deltalen,
        data_uncompressed_length=textlen,
        data_compression_mode=compression_mode,
        data_delta_base=deltainfo.base,
        link_rev=link,
        parent_rev_1=p1r,
        parent_rev_2=p2r,
        node_id=node,
        sidedata_offset=sidedata_offset,
        sidedata_compressed_length=len(serialized_sidedata),
        sidedata_compression_mode=sidedata_compression_mode,
        rank=rank,
    )

    self.index.append(e)
    entry = self.index.entry_binary(curr)
    if curr == 0 and self._docket is None:
        # first entry of a docket-less revlog: prepend the packed header
        header = self._format_flags | self._format_version
        header = self.index.pack_header(header)
        entry = header + entry
    self._writeentry(
        transaction,
        entry,
        deltainfo.data,
        link,
        offset,
        serialized_sidedata,
        sidedata_offset,
    )

    rawtext = btext[0]

    if alwayscache and rawtext is None:
        rawtext = deltacomputer.buildtext(revinfo)

    if type(rawtext) == bytes:  # only accept immutable objects
        self._inner._revisioncache = (node, curr, rawtext)
    self._chainbasecache[curr] = deltainfo.chainbase
    return curr

3265

3266

def _get_data_offset(self, prev):

3266

def _get_data_offset(self, prev):

3267

"""Returns the current offset in the (in-transaction) data file.

3267

"""Returns the current offset in the (in-transaction) data file.

3268

Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket

3268

Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket

3269

file to store that information: since sidedata can be rewritten to the

3269

file to store that information: since sidedata can be rewritten to the

3270

end of the data file within a transaction, you can have cases where, for

3270

end of the data file within a transaction, you can have cases where, for

3271

example, rev `n` does not have sidedata while rev `n - 1` does, leading

3271

example, rev `n` does not have sidedata while rev `n - 1` does, leading

3272

to `n - 1`'s sidedata being written after `n`'s data.

3272

to `n - 1`'s sidedata being written after `n`'s data.

3273

3274

TODO cache this in a docket file before getting out of experimental."""

3274

TODO cache this in a docket file before getting out of experimental."""

3275

if self._docket is None:

3275

if self._docket is None:

3276

return self.end(prev)

3276

return self.end(prev)

3277

else:

3277

else:

3278

return self._docket.data_end

3278

return self._docket.data_end

3279

3280

def _writeentry(
    self,
    transaction,
    entry,
    data,
    link,
    offset,
    sidedata,
    sidedata_offset,
):
    """Write one revision through ``self._inner.write_entry()``.

    After the write, the inline size limit is enforced, the docket end
    offsets (when a docket exists) are updated from the values returned by
    ``write_entry()``, and the persistent nodemap is set up for the
    transaction.
    """
    # Files opened in a+ mode have inconsistent behavior on various
    # platforms. Windows requires that a file positioning call be made
    # when the file handle transitions between reads and writes. See
    # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
    # platforms, Python or the platform itself can be buggy. Some versions
    # of Solaris have been observed to not append at the end of the file
    # if the file was seeked to before the end. See issue4943 for more.
    #
    # We work around this issue by inserting a seek() before writing.
    # Note: This is likely not necessary on Python 3. However, because
    # the file handle is reused for reads and may be seeked there, we need
    # to be careful before changing this.
    #
    # NOTE(review): no seek() is issued in this method; presumably it
    # happens inside self._inner.write_entry() using the *_end values
    # passed below -- confirm.
    index_end = data_end = sidedata_end = None
    if self._docket is not None:
        index_end = self._docket.index_end
        data_end = self._docket.data_end
        sidedata_end = self._docket.sidedata_end

    files_end = self._inner.write_entry(
        transaction,
        entry,
        data,
        link,
        offset,
        sidedata,
        sidedata_offset,
        index_end,
        data_end,
        sidedata_end,
    )
    self._enforceinlinesize(transaction)
    if self._docket is not None:
        # files_end is indexed as (index, data, sidedata)
        self._docket.index_end = files_end[0]
        self._docket.data_end = files_end[1]
        self._docket.sidedata_end = files_end[2]

    nodemaputil.setup_persistent_nodemap(transaction, self)

3327

3328

def addgroup(
    self,
    deltas,
    linkmapper,
    transaction,
    alwayscache=False,
    addrevisioncb=None,
    duplicaterevisioncb=None,
    debug_info=None,
    delta_base_reuse_policy=None,
):
    """
    add a delta group

    given a set of deltas, add them to the revision log. the
    first delta is against its parent, which should be in our
    log, the rest are against the previous delta.

    Each item of ``deltas`` is an 8-tuple ``(node, p1, p2, linknode,
    deltabase, delta, flags, sidedata)``; ``linkmapper`` turns ``linknode``
    into the linkrev to store.

    If ``addrevisioncb`` is defined, it will be called with arguments of
    this revlog and the revision number that was added.

    If ``duplicaterevisioncb`` is defined, it will be called with this
    revlog and the revision number of each delta whose node is already
    stored.

    ``delta_base_reuse_policy`` defaults to a value derived from the
    revlog's delta configuration when left to None.

    Returns True if at least one delta was processed (added or found to
    be a duplicate), False if ``deltas`` was empty.

    Raises ``error.ProgrammingError`` on nested calls,
    ``error.LookupError`` for an unknown parent or delta base, and
    ``error.CensoredBaseError`` when a delta against a censored base is
    not a full replacement.
    """

    if self._adding_group:
        raise error.ProgrammingError(b'cannot nest addgroup() calls')

    # read the default delta-base reuse policy from revlog config if the
    # group did not specify one.
    if delta_base_reuse_policy is None:
        if (
            self.delta_config.general_delta
            and self.delta_config.lazy_delta_base
        ):
            delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
        else:
            delta_base_reuse_policy = DELTA_BASE_REUSE_NO

    self._adding_group = True
    empty = True
    try:
        with self._writing(transaction):
            write_debug = None
            if self.delta_config.debug_delta:
                write_debug = transaction._report
            deltacomputer = deltautil.deltacomputer(
                self,
                write_debug=write_debug,
                debug_info=debug_info,
            )
            # loop through our set of deltas
            for data in deltas:
                (
                    node,
                    p1,
                    p2,
                    linknode,
                    deltabase,
                    delta,
                    flags,
                    sidedata,
                ) = data
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                rev = self.index.get_rev(node)
                if rev is not None:
                    # this can happen if two branches make the same change
                    self._nodeduplicatecallback(transaction, rev)
                    if duplicaterevisioncb:
                        duplicaterevisioncb(self, rev)
                    empty = False
                    continue

                for p in (p1, p2):
                    if not self.index.has_node(p):
                        raise error.LookupError(
                            p, self.radix, _(b'unknown parent')
                        )

                if not self.index.has_node(deltabase):
                    raise error.LookupError(
                        deltabase, self.display_id, _(b'unknown delta base')
                    )

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # if base is censored, delta must be full replacement in a
                    # single patch operation
                    hlen = struct.calcsize(b">lll")
                    oldlen = self.rawsize(baserev)
                    newlen = len(delta) - hlen
                    if delta[:hlen] != mdiff.replacediffheader(
                        oldlen, newlen
                    ):
                        raise error.CensoredBaseError(
                            self.display_id, self.node(baserev)
                        )

                if not flags and self._peek_iscensored(baserev, delta):
                    flags |= REVIDX_ISCENSORED

                # We assume consumers of addrevisioncb will want to retrieve
                # the added revision, which will require a call to
                # revision(). revision() will fast path if there is a cache
                # hit. So, we tell _addrevision() to always cache in this case.
                # We're only using addgroup() in the context of changegroup
                # generation so the revision data can always be handled as raw
                # by the flagprocessor.
                rev = self._addrevision(
                    node,
                    None,
                    transaction,
                    link,
                    p1,
                    p2,
                    flags,
                    (baserev, delta, delta_base_reuse_policy),
                    alwayscache=alwayscache,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

                if addrevisioncb:
                    addrevisioncb(self, rev)
                empty = False
    finally:
        # always clear the guard so a failed group does not block later ones
        self._adding_group = False
    return not empty

3456

3457

def iscensored(self, rev):
    """Check if a file revision is censored.

    Returns ``False`` when the revlog is not censorable; otherwise returns
    the result of masking the revision flags with ``REVIDX_ISCENSORED``
    (truthy when the flag is set).
    """
    if self.feature_config.censorable:
        return self.flags(rev) & REVIDX_ISCENSORED
    return False

3463

3464

def _peek_iscensored(self, baserev, delta):
    """Quickly check if a delta produces a censored revision.

    Non-censorable revlogs always answer ``False``; otherwise the decision
    is delegated to ``storageutil.deltaiscensored``.
    """
    if self.feature_config.censorable:
        return storageutil.deltaiscensored(delta, baserev, self.rawsize)
    return False

3470

3471

def getstrippoint(self, minlink):
    """find the minimum rev that must be stripped to strip the linkrev

    Returns a tuple containing the minimum rev and a set of all revs that
    have linkrevs that will be broken by this strip.
    """
    # index of the last revision currently stored
    tiprev = len(self) - 1
    heads = self.headrevs()
    return storageutil.resolvestripinfo(
        minlink, tiprev, heads, self.linkrev, self.parentrevs
    )

3484

3485

def strip(self, minlink, transaction):
    """truncate the revlog on the first revision with a linkrev >= minlink

    This function is called when we're stripping revision minlink and
    its descendants from the repository.

    All revisions with linkrev >= minlink have to go, because the
    equivalent changelog revisions will be renumbered after the strip.

    The revlog is therefore truncated at the first such revision; the
    caller is trusted to have saved the revisions that should survive and
    to re-add them after this truncation.
    """
    if not len(self):
        return

    rev, _brokenrevs = self.getstrippoint(minlink)
    if rev == len(self):
        # the strip point lies past the last stored revision
        return

    # first truncate the files on disk
    data_end = self.start(rev)
    if self._inline:
        # inline revlogs keep index entries and data in the same file
        end = data_end + (rev * self.index.entry_size)
    else:
        transaction.add(self._datafile, data_end)
        end = rev * self.index.entry_size

    if self._sidedatafile:
        sidedata_end = self.sidedata_cut_off(rev)
        transaction.add(self._sidedatafile, sidedata_end)

    transaction.add(self._indexfile, end)
    docket = self._docket
    if docket is not None:
        # XXX we could leverage the docket while stripping. However it is
        # not powerful enough at the time of this comment
        #
        # NOTE(review): ``sidedata_end`` is only bound when
        # ``self._sidedatafile`` is set; presumably a docket always comes
        # with a sidedata file -- confirm.
        docket.index_end = end
        docket.data_end = data_end
        docket.sidedata_end = sidedata_end
        docket.write(transaction, stripping=True)

    # then reset internal state in memory to forget those revisions
    self._chaininfocache = util.lrucachedict(500)
    self._inner.clear_cache()

    del self.index[rev:-1]

3532

3533

def checksize(self):
    """Check size of index and data files

    return a (dd, di) tuple.
    - dd: extra bytes for the "data" file
    - di: extra bytes for the "index" file

    A healthy revlog will return (0, 0).

    A missing data (resp. index) file is reported as 0 extra bytes for
    that file.
    """
    expected = 0
    if len(self):
        # end offset of the last revision == expected data size
        expected = max(0, self.end(len(self) - 1))

    try:
        with self._datafp() as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        dd = actual - expected
    except FileNotFoundError:
        dd = 0

    try:
        # Use a context manager so the handle is released even when
        # seek()/tell() raises.
        with self.opener(self._indexfile) as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        s = self.index.entry_size
        i = max(0, actual // s)
        # bytes left over after the last complete index entry
        di = actual - (i * s)
        if self._inline:
            # inline revlogs store the data in the index file: account
            # for it there and report no discrepancy for the data file
            databytes = sum(max(0, self.length(r)) for r in self)
            dd = 0
            di = actual - len(self) * s - databytes
    except FileNotFoundError:
        di = 0

    return (dd, di)

3572

3573

def files(self):
    """return list of files that compose this revlog

    Without a docket file this is the index file plus, for non-inline
    revlogs, the data file. With a docket, the docket file and the older
    index/data/sidedata files it reports are listed too; the current data
    and sidedata files are only included when their recorded end offset is
    non-zero.
    """
    paths = [self._indexfile]
    if self._docket_file is not None:
        docket = self._docket
        paths.append(self._docket_file)
        paths.extend(docket.old_index_filepaths(include_empty=False))
        if docket.data_end:
            paths.append(self._datafile)
        paths.extend(docket.old_data_filepaths(include_empty=False))
        if docket.sidedata_end:
            paths.append(self._sidedatafile)
        paths.extend(docket.old_sidedata_filepaths(include_empty=False))
    elif not self._inline:
        paths.append(self._datafile)
    return paths

3589

3590

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
    sidedata_helpers=None,
    debug_info=None,
):
    """Validate/normalize the arguments and delegate to
    ``storageutil.emitrevisions``.

    ``nodesorder`` must be one of ``b'nodes'``, ``b'storage'``,
    ``b'linear'`` or ``None``; anything else raises
    ``error.ProgrammingError``.
    """
    known_orders = (b'nodes', b'storage', b'linear', None)
    if nodesorder not in known_orders:
        raise error.ProgrammingError(
            b'unhandled value for nodesorder: %s' % nodesorder
        )

    # without general delta, default to storage order
    if nodesorder is None and not self.delta_config.general_delta:
        nodesorder = b'storage'

    # when delta chains are not stored, emit full revisions unless the
    # caller explicitly asked for deltas against the previous revision
    if not (
        self._storedeltachains
        or deltamode == repository.CG_DELTAMODE_PREV
    ):
        deltamode = repository.CG_DELTAMODE_FULL

    return storageutil.emitrevisions(
        self,
        nodes,
        nodesorder,
        revlogrevisiondelta,
        deltaparentfn=self.deltaparent,
        candeltafn=self._candelta,
        rawsizefn=self.rawsize,
        revdifffn=self.revdiff,
        flagsfn=self.flags,
        deltamode=deltamode,
        revisiondata=revisiondata,
        assumehaveparentrevisions=assumehaveparentrevisions,
        sidedata_helpers=sidedata_helpers,
        debug_info=debug_info,
    )

3630

3631

# Delta reuse policies accepted by the ``deltareuse`` argument of ``clone()``.
DELTAREUSEALWAYS = b'always'
DELTAREUSESAMEREVS = b'samerevs'
DELTAREUSENEVER = b'never'

DELTAREUSEFULLADD = b'fulladd'

# Every valid policy value, used to validate ``deltareuse``.
DELTAREUSEALL = {
    DELTAREUSEALWAYS,
    DELTAREUSESAMEREVS,
    DELTAREUSENEVER,
    DELTAREUSEFULLADD,
}

3638

3639

def clone(
    self,
    tr,
    destrevlog,
    addrevisioncb=None,
    deltareuse=DELTAREUSESAMEREVS,
    forcedeltabothparents=None,
    sidedata_helpers=None,
):
    """Copy this revlog to another, possibly with format changes.

    The destination revlog will contain the same revisions and nodes.
    However, it may not be bit-for-bit identical due to e.g. delta encoding
    differences.

    The ``deltareuse`` argument controls how deltas from the existing
    revlog are preserved in the destination revlog. The argument can have
    the following values:

    DELTAREUSEALWAYS
       Deltas will always be reused (if possible), even if the destination
       revlog would not select the same revisions for the delta. This is the
       fastest mode of operation.
    DELTAREUSESAMEREVS
       Deltas will be reused if the destination revlog would pick the same
       revisions for the delta. This mode strikes a balance between speed
       and optimization.
    DELTAREUSENEVER
       Deltas will never be reused. This is the slowest mode of execution.
       This mode can be used to recompute deltas (e.g. if the diff/delta
       algorithm changes).
    DELTAREUSEFULLADD
       Revisions will be re-added as if they were new content. This is
       slower than DELTAREUSEALWAYS but allows more mechanisms to kick in,
       e.g. large file detection and handling.

    Delta computation can be slow, so the choice of delta reuse policy can
    significantly affect run time.

    The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
    two extremes. Deltas will be reused if they are appropriate. But if the
    delta could choose a better revision, it will do so. This means if you
    are converting a non-generaldelta revlog to a generaldelta revlog,
    deltas will be recomputed if the delta's parent isn't a parent of the
    revision.

    In addition to the delta policy, the ``forcedeltabothparents``
    argument controls whether to force compute deltas against both parents
    for merges. By default, the current default is used.

    See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
    `sidedata_helpers`.

    Raises ``ValueError`` when ``deltareuse`` is not a known policy, when
    the destination is not empty, or when either revlog has filtered
    revisions.
    """
    if deltareuse not in self.DELTAREUSEALL:
        raise ValueError(
            _(b'value for deltareuse invalid: %s') % deltareuse
        )

    if len(destrevlog):
        raise ValueError(_(b'destination revlog is not empty'))

    if getattr(self, 'filteredrevs', None):
        raise ValueError(_(b'source revlog has filtered revisions'))
    if getattr(destrevlog, 'filteredrevs', None):
        raise ValueError(_(b'destination revlog has filtered revisions'))

    # lazydelta and lazydeltabase controls whether to reuse a cached delta,
    # if possible. Work on a copy of the destination's delta configuration
    # and put the original back once the copy is done.
    old_delta_config = destrevlog.delta_config
    destrevlog.delta_config = destrevlog.delta_config.copy()

    try:
        # policy -> (lazy_delta_base, lazy_delta); DELTAREUSEFULLADD is
        # deliberately absent and leaves both settings untouched
        lazy_settings = {
            self.DELTAREUSEALWAYS: (True, True),
            self.DELTAREUSESAMEREVS: (False, True),
            self.DELTAREUSENEVER: (False, False),
        }
        chosen = lazy_settings.get(deltareuse)
        if chosen is not None:
            lazy_base, lazy = chosen
            destrevlog.delta_config.lazy_delta_base = lazy_base
            destrevlog.delta_config.lazy_delta = lazy

        destrevlog.delta_config.delta_both_parents = (
            forcedeltabothparents or old_delta_config.delta_both_parents
        )

        with self.reading(), destrevlog._writing(tr):
            self._clone(
                tr,
                destrevlog,
                addrevisioncb,
                deltareuse,
                forcedeltabothparents,
                sidedata_helpers,
            )

    finally:
        destrevlog.delta_config = old_delta_config

3738

3739

def _clone(
    self,
    tr,
    destrevlog,
    addrevisioncb,
    deltareuse,
    forcedeltabothparents,
    sidedata_helpers,
):
    """perform the core duty of `revlog.clone` after parameter processing

    Every revision of ``self`` is re-added to ``destrevlog`` in order.
    With ``DELTAREUSEFULLADD`` the revision goes through
    ``destrevlog.addrevision``; otherwise it goes through
    ``destrevlog._addrevision``, reusing the stored delta when the
    destination's ``lazy_delta`` setting allows it.

    When ``sidedata_helpers`` is given, the helpers are run on each
    revision's sidedata and the (flags to add, flags to remove) pair they
    return is applied to the revision flags.

    ``addrevisioncb``, when set, is called as
    ``addrevisioncb(self, rev, node)`` after each revision.
    """
    write_debug = None
    if self.delta_config.debug_delta:
        write_debug = tr._report
    deltacomputer = deltautil.deltacomputer(
        destrevlog,
        write_debug=write_debug,
    )
    index = self.index
    for rev in self:
        entry = index[rev]

        # Some classes override linkrev to take filtered revs into
        # account. Use raw entry from index.
        flags = entry[0] & 0xFFFF
        linkrev = entry[4]
        p1 = index[entry[5]][7]
        p2 = index[entry[6]][7]
        node = entry[7]

        # (Possibly) reuse the delta from the revlog if allowed and
        # the revlog chunk is a delta.
        cachedelta = None
        rawtext = None
        if deltareuse == self.DELTAREUSEFULLADD:
            text = self._revisiondata(rev)
            sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # Add the requested flags, then clear the ones to remove.
                # The parentheses matter: ``&`` binds tighter than ``|``,
                # so without them removals would never apply to flags
                # that were already set.
                flags = (flags | new_flags[0]) & ~new_flags[1]

            destrevlog.addrevision(
                text,
                tr,
                linkrev,
                p1,
                p2,
                cachedelta=cachedelta,
                node=node,
                flags=flags,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )
        else:
            if destrevlog.delta_config.lazy_delta:
                dp = self.deltaparent(rev)
                if dp != nullrev:
                    cachedelta = (dp, bytes(self._inner._chunk(rev)))

            if not cachedelta:
                # no reusable delta: hand over the raw text instead
                try:
                    rawtext = self._revisiondata(rev)
                except error.CensoredNodeError as censored:
                    assert flags & REVIDX_ISCENSORED
                    rawtext = censored.tombstone
            sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # see the note in the other branch about the parentheses
                flags = (flags | new_flags[0]) & ~new_flags[1]

            destrevlog._addrevision(
                node,
                rawtext,
                tr,
                linkrev,
                p1,
                p2,
                flags,
                cachedelta,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )

        if addrevisioncb:
            addrevisioncb(self, rev, node)

3832

3833

def censorrevision(self, tr, censornode, tombstone=b''):
    """Censor ``censornode`` using the routine matching the revlog format.

    Raises ``error.RevlogError`` for version 0 revlogs. Version 1 revlogs
    are handled by ``rewrite.v1_censor``; every other version goes to
    ``rewrite.v2_censor``.
    """
    if self._format_version == REVLOGV0:
        raise error.RevlogError(
            _(b'cannot censor with version %d revlogs')
            % self._format_version
        )

    if self._format_version == REVLOGV1:
        censor = rewrite.v1_censor
    else:
        censor = rewrite.v2_censor
    censor(self, tr, censornode, tombstone)

3843

3844

def verifyintegrity(self, state):
    """Verifies the integrity of the revlog.

    Yields ``revlogproblem`` instances describing problems that are
    found.

    ``state`` is a dict: ``b'expectedversion'`` and ``b'erroroncensored'``
    are read (plus the optional ``b'skipflags'``), while ``b'skipread'``
    and ``b'safe_renamed'`` are reset to empty sets before the revisions
    are checked.
    """
    data_extra, index_extra = self.checksize()
    if data_extra:
        yield revlogproblem(
            error=_(b'data length off by %d bytes') % data_extra
        )
    if index_extra:
        yield revlogproblem(
            error=_(b'index contains %d extra bytes') % index_extra
        )

    version = self._format_version

    # The verifier tells us what version revlog we should be.
    if version != state[b'expectedversion']:
        yield revlogproblem(
            warning=_(b"warning: '%s' uses revlog format %d; expected %d")
            % (self.display_id, version, state[b'expectedversion'])
        )

    state[b'skipread'] = set()
    state[b'safe_renamed'] = set()

    for rev in self:
        node = self.node(rev)

        # Verify contents. 4 cases to care about:
        #
        #   common: the most common case
        #   rename: with a rename
        #   meta: file content starts with b'\1\n', the metadata
        #         header defined in filelog.py, but without a rename
        #   ext: content stored externally
        #
        # More formally, their differences are shown below:
        #
        #                       | common | rename | meta  | ext
        #  -------------------------------------------------------
        #   flags()             | 0      | 0      | 0     | not 0
        #   renamed()           | False  | True   | False | ?
        #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
        #
        # "rawtext" means the raw text stored in revlog data, which
        # could be retrieved by "rawdata(rev)". "text"
        # mentioned below is "revision(rev)".
        #
        # There are 3 different lengths stored physically:
        #  1. L1: rawsize, stored in revlog index
        #  2. L2: len(rawtext), stored in revlog data
        #  3. L3: len(text), stored in revlog data if flags==0, or
        #     possibly somewhere else if flags!=0
        #
        # L1 should be equal to L2. L3 could be different from them.
        # "text" may or may not affect commit hash depending on flag
        # processors (see flagutil.addflagprocessor).
        #
        #              | common  | rename | meta  | ext
        # -------------------------------------------------
        # rawsize()    | L1      | L1     | L1    | L1
        # size()       | L1      | L2-LM  | L1(*) | L1 (?)
        # len(rawtext) | L2      | L2     | L2    | L2
        # len(text)    | L2      | L2     | L2    | L3
        # len(read())  | L2      | L2-LM  | L2-LM | L3 (?)
        #
        # LM:  length of metadata, depending on rawtext
        # (*): not ideal, see comment in filelog.size
        # (?): could be "- len(meta)" if the resolved content has
        #      rename metadata
        #
        # Checks needed to be done:
        #  1. length check: L1 == L2, in all cases.
        #  2. hash check: depending on flag processor, we may need to
        #     use either "text" (external), or "rawtext" (in revlog).

        try:
            skipflags = state.get(b'skipflags', 0)
            if skipflags:
                # only keep the skip flags this revision actually carries
                skipflags &= self.flags(rev)

            _verify_revision(self, skipflags, state, node)

            indexed_size = self.rawsize(rev)
            unpacked_size = len(self.rawdata(node))

            if indexed_size != unpacked_size:
                yield revlogproblem(
                    error=_(b'unpacked size is %d, %d expected')
                    % (unpacked_size, indexed_size),
                    node=node,
                )

        except error.CensoredNodeError:
            if state[b'erroroncensored']:
                yield revlogproblem(
                    error=_(b'censored file data'), node=node
                )
                state[b'skipread'].add(node)
        except Exception as exc:
            yield revlogproblem(
                error=_(b'unpacking %s: %s')
                % (short(node), stringutil.forcebytestr(exc)),
                node=node,
            )
            state[b'skipread'].add(node)

3948

3949

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Return a dict holding the requested pieces of storage information.

    Each argument that is true adds the bytes key of the same name:

    * ``exclusivefiles``: list of ``(opener, path)`` pairs for the index
      file and, when the revlog is not inline, the data file.
    * ``sharedfiles``: always an empty list.
    * ``revisionscount``: ``len(self)``.
    * ``trackedsize``: sum of ``self.rawsize(rev)`` over all revisions.
    * ``storedsize``: sum of the ``st_size`` of every path in
      ``self.files()``.
    """
    info = {}

    if exclusivefiles:
        owned = [(self.opener, self._indexfile)]
        if not self._inline:
            owned.append((self.opener, self._datafile))
        info[b'exclusivefiles'] = owned

    if sharedfiles:
        info[b'sharedfiles'] = []

    if revisionscount:
        info[b'revisionscount'] = len(self)

    if trackedsize:
        info[b'trackedsize'] = sum(map(self.rawsize, iter(self)))

    if storedsize:
        on_disk = 0
        for path in self.files():
            on_disk += self.opener.stat(path).st_size
        info[b'storedsize'] = on_disk

    return info

3979

3980

def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
    """Generate sidedata for revisions ``startrev`` to ``endrev`` inclusive.

    For each revision the sidedata helpers are run, the serialized (and
    possibly compressed) result is appended to the sidedata file, and the
    index entry is rewritten with the new sidedata offset, length, flags
    and compression mode.

    Returns ``None`` without doing anything when the revlog has no
    sidedata support, or when ``helpers[1]`` and ``helpers[2]`` are both
    empty (nothing to generate or remove).

    Raises ``error.Abort`` if a revision in the range already has sidedata.
    """
    if not self.feature_config.has_side_data:
        return
    # revlog formats with sidedata support do not support inline
    assert not self._inline
    if not helpers[1] and not helpers[2]:
        # Nothing to generate or remove
        return

    new_entries = []
    # append the new sidedata
    with self._writing(transaction):
        ifh, _dfh, sdfh = self._inner._writinghandles
        # The offset used below is read back from the sidedata handle, so
        # it is that handle (not the data handle) that must be positioned
        # at the end of the existing sidedata.
        sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)

        current_offset = sdfh.tell()
        for rev in range(startrev, endrev + 1):
            entry = self.index[rev]
            new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                store=self,
                sidedata_helpers=helpers,
                sidedata={},
                rev=rev,
            )

            serialized_sidedata = sidedatautil.serialize_sidedata(
                new_sidedata
            )

            sidedata_compression_mode = COMP_MODE_INLINE
            if serialized_sidedata and self.feature_config.has_side_data:
                sidedata_compression_mode = COMP_MODE_PLAIN
                h, comp_sidedata = self._inner.compress(serialized_sidedata)
                # Slice with [0:1] so the header is compared as bytes;
                # indexing bytes with [0] yields an int, which never
                # equals a bytes value.
                if (
                    h != b'u'
                    and comp_sidedata[0:1] != b'\0'
                    and len(comp_sidedata) < len(serialized_sidedata)
                ):
                    assert not h
                    if (
                        comp_sidedata[0:1]
                        == self._docket.default_compression_header
                    ):
                        sidedata_compression_mode = COMP_MODE_DEFAULT
                        serialized_sidedata = comp_sidedata
                    else:
                        sidedata_compression_mode = COMP_MODE_INLINE
                        serialized_sidedata = comp_sidedata
            if entry[8] != 0 or entry[9] != 0:
                # rewriting entries that already have sidedata is not
                # supported yet, because it introduces garbage data in the
                # revlog.
                msg = b"rewriting existing sidedata is not supported yet"
                raise error.Abort(msg)

            # Apply (potential) flags to add and to remove after running
            # the sidedata helpers. The parentheses matter: `&` binds
            # tighter than `|`, so without them the flags to remove would
            # only be masked out of the flags to add, never out of the
            # existing entry.
            new_offset_flags = (entry[0] | flags[0]) & ~flags[1]
            entry_update = (
                current_offset,
                len(serialized_sidedata),
                new_offset_flags,
                sidedata_compression_mode,
            )

            # the sidedata computation might have moved the file cursors
            # around
            sdfh.seek(current_offset, os.SEEK_SET)
            sdfh.write(serialized_sidedata)
            new_entries.append(entry_update)
            current_offset += len(serialized_sidedata)
            self._docket.sidedata_end = sdfh.tell()

        # rewrite the new index entries
        ifh.seek(startrev * self.index.entry_size)
        for i, e in enumerate(new_entries):
            rev = startrev + i
            self.index.replace_sidedata_info(rev, *e)
            packed = self.index.entry_binary(rev)
            if rev == 0 and self._docket is None:
                header = self._format_flags | self._format_version
                header = self.index.pack_header(header)
                packed = header + packed
            ifh.write(packed)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # revlog.py - storage back-end for mercurial
             # coding: utf8
             #
             # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Storage back-end for Mercurial.
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches.
             """
             import binascii
             import collections
             import contextlib
             import functools
             import io
             import os
             import struct
             import weakref
             import zlib
             # import stuff from node for others to import from revlog
             from .node import (
                 bin,
                 hex,
                 nullrev,
                 sha1nodeconstants,
                 short,
                 wdirrev,
             )
             from .i18n import _
             from .revlogutils.constants import (
                 ALL_KINDS,
                 CHANGELOGV2,
                 COMP_MODE_DEFAULT,
                 COMP_MODE_INLINE,
                 COMP_MODE_PLAIN,
                 DELTA_BASE_REUSE_NO,
                 DELTA_BASE_REUSE_TRY,
                 ENTRY_RANK,
                 FEATURES_BY_VERSION,
                 FLAG_GENERALDELTA,
                 FLAG_INLINE_DATA,
                 INDEX_HEADER,
                 KIND_CHANGELOG,
                 KIND_FILELOG,
                 RANK_UNKNOWN,
                 REVLOGV0,
                 REVLOGV1,
                 REVLOGV1_FLAGS,
                 REVLOGV2,
                 REVLOGV2_FLAGS,
                 REVLOG_DEFAULT_FLAGS,
                 REVLOG_DEFAULT_FORMAT,
                 REVLOG_DEFAULT_VERSION,
                 SUPPORTED_FLAGS,
             )
             from .revlogutils.flagutil import (
                 REVIDX_DEFAULT_FLAGS,
                 REVIDX_ELLIPSIS,
                 REVIDX_EXTSTORED,
                 REVIDX_FLAGS_ORDER,
                 REVIDX_HASCOPIESINFO,
                 REVIDX_ISCENSORED,
                 REVIDX_RAWTEXT_CHANGING_FLAGS,
             )
             from .thirdparty import attr
             from . import (
                 ancestor,
                 dagop,
                 error,
                 mdiff,
                 policy,
                 pycompat,
                 revlogutils,
                 templatefilters,
                 util,
             )
             from .interfaces import (
                 repository,
                 util as interfaceutil,
             )
             from .revlogutils import (
                 deltas as deltautil,
                 docket as docketutil,
                 flagutil,
                 nodemap as nodemaputil,
                 randomaccessfile,
                 revlogv0,
                 rewrite,
                 sidedata as sidedatautil,
             )
             from .utils import (
                 storageutil,
                 stringutil,
             )
             # Bare references to the names below keep pyflakes from reporting them as
             # unused. These names must stay available in this module for extensions.
             REVLOGV0
             REVLOGV1
             REVLOGV2
             CHANGELOGV2
             FLAG_INLINE_DATA
             FLAG_GENERALDELTA
             REVLOG_DEFAULT_FLAGS
             REVLOG_DEFAULT_FORMAT
             REVLOG_DEFAULT_VERSION
             REVLOGV1_FLAGS
             REVLOGV2_FLAGS
             REVIDX_ISCENSORED
             REVIDX_ELLIPSIS
             REVIDX_HASCOPIESINFO
             REVIDX_EXTSTORED
             REVIDX_DEFAULT_FLAGS
             REVIDX_FLAGS_ORDER
             REVIDX_RAWTEXT_CHANGING_FLAGS
             parsers = policy.importmod('parsers')
             rustancestor = policy.importrust('ancestor')
             rustdagop = policy.importrust('dagop')
             rustrevlog = policy.importrust('revlog')
             # Aliased for performance.
             _zlibdecompress = zlib.decompress
             # max size of inline data embedded into a revlog
             _maxinline = 131072
             # Flag processors for REVIDX_ELLIPSIS.
             def ellipsisreadprocessor(rl, text):
                 """Read-side processor for REVIDX_ELLIPSIS.

                 Hands ``text`` back untouched, paired with ``False``; ``rl`` is
                 not used.
                 """
                 unchanged = text
                 return (unchanged, False)
             def ellipsiswriteprocessor(rl, text):
                 """Write-side processor for REVIDX_ELLIPSIS.

                 Hands ``text`` back untouched, paired with ``False``; ``rl`` is
                 not used.
                 """
                 unchanged = text
                 return (unchanged, False)
             def ellipsisrawprocessor(rl, text):
                 """Raw processor for REVIDX_ELLIPSIS.

                 Always answers ``False``, whatever ``rl`` and ``text`` are.
                 """
                 answer = False
                 return answer
             ellipsisprocessor = (
                 ellipsisreadprocessor,
                 ellipsiswriteprocessor,
                 ellipsisrawprocessor,
             )
             def _verify_revision(rl, skipflags, state, node):
                 """Verify the integrity of the given revlog ``node`` while providing a hook
                 point for extensions to influence the operation."""
                 if skipflags:
                     state[b'skipread'].add(node)
                 else:
                     # Side-effect: read content and verify hash.
                     rl.revision(node)
             # True if a fast implementation of the persistent nodemap is available.
             #
             # The "pure" Python implementation is also counted as "fast": people using
             # pure do not really have performance considerations (and already have a
             # wheelbarrow of other sources of slowness).
             HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
                 parsers, 'BaseIndexObject'
             )
             @interfaceutil.implementer(repository.irevisiondelta)
             @attr.s(slots=True)
             class revlogrevisiondelta:
                 """attrs record declared as implementing ``repository.irevisiondelta``.

                 All fields are required at construction except ``linknode``, which
                 defaults to ``None``.
                 """
                 node = attr.ib()
                 p1node = attr.ib()
                 p2node = attr.ib()
                 basenode = attr.ib()
                 flags = attr.ib()
                 baserevisionsize = attr.ib()
                 revision = attr.ib()
                 delta = attr.ib()
                 sidedata = attr.ib()
                 protocol_flags = attr.ib()
                 # the only optional field
                 linknode = attr.ib(default=None)
             @interfaceutil.implementer(repository.iverifyproblem)
             @attr.s(frozen=True)
             class revlogproblem:
                 """Frozen attrs record declared as implementing
                 ``repository.iverifyproblem``.

                 Every field is optional and defaults to ``None``.
                 """
                 warning = attr.ib(default=None)
                 error = attr.ib(default=None)
                 node = attr.ib(default=None)
             def parse_index_v1(data, inline):
                 """Parse index ``data`` through ``parsers.parse_index2``.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # hand the raw index data over to the ``parsers`` implementation
                 parsed = parsers.parse_index2(data, inline)
                 index, cache = parsed
                 return (index, cache)
             def parse_index_v2(data, inline):
                 """Parse index ``data`` through ``parsers.parse_index2`` using the
                 ``REVLOGV2`` format.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # hand the raw index data over to the ``parsers`` implementation
                 parsed = parsers.parse_index2(data, inline, format=REVLOGV2)
                 index, cache = parsed
                 return (index, cache)
             def parse_index_cl_v2(data, inline):
                 """Parse index ``data`` through ``parsers.parse_index2`` using the
                 ``CHANGELOGV2`` format.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # hand the raw index data over to the ``parsers`` implementation
                 parsed = parsers.parse_index2(data, inline, format=CHANGELOGV2)
                 index, cache = parsed
                 return (index, cache)
             if not hasattr(parsers, 'parse_index_devel_nodemap'):
                 # the parsers module does not provide the devel nodemap parser
                 parse_index_v1_nodemap = None
             else:
                 def parse_index_v1_nodemap(data, inline):
                     """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``
                     and return its ``(index, cache)`` pair."""
                     parsed = parsers.parse_index_devel_nodemap(data, inline)
                     index, cache = parsed
                     return (index, cache)
-            def parse_index_v1_mixed(data, inline, default_header):
+            def parse_index_v1_rust(data, inline, default_header):
                 cache = (0, data) if inline else None
-                return rustrevlog.MixedIndex(data, default_header), cache
+                return rustrevlog.Index(data, default_header), cache
             # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
             # signed integer)
             _maxentrysize = 0x7FFFFFFF
             FILE_TOO_SHORT_MSG = _(
                 b'cannot read from revlog %s;'
                 b'  expected %d bytes from offset %d, data size is %d'
             )
             hexdigits = b'0123456789abcdefABCDEF'
             class _Config:
                 def copy(self):
                     return self.__class__(**self.__dict__)
             @attr.s()
             class FeatureConfig(_Config):
                 """Hold configuration values about the available revlog features"""
                 # name of the default compression engine
                 compression_engine = attr.ib(default=b'zlib')
                 # options for the compression engines (a fresh dict per instance)
                 compression_engine_options = attr.ib(default=attr.Factory(dict))
                 # whether censoring can be used on this revlog
                 censorable = attr.ib(default=False)
                 # whether this revlog uses the "side data" feature
                 has_side_data = attr.ib(default=False)
                 # might remove rank configuration once the computation has no impact
                 compute_rank = attr.ib(default=False)
                 # Parent order is supposed to be semantically irrelevant, so we
                 # normally re-sort parents to ensure that the first parent is non-null,
                 # if there is a non-null parent at all.
                 # filelog abuses the parent order as a flag to mark some instances of
                 # meta-encoded files, so allow it to disable this behavior.
                 canonical_parent_order = attr.ib(default=False)
                 # whether ellipsis commits can be used
                 enable_ellipsis = attr.ib(default=False)
                 def copy(self):
                     """Return a copy that has its own copy of
                     ``compression_engine_options`` instead of sharing the same
                     object with this instance."""
                     new = super().copy()
                     new.compression_engine_options = self.compression_engine_options.copy()
                     return new
             @attr.s()
             class DataConfig(_Config):
                 """Hold configuration values about how the revlog data are read"""
                 # should we try to open the "pending" version of the revlog
                 try_pending = attr.ib(default=False)
                 # should we try to open the "split" version of the revlog
                 try_split = attr.ib(default=False)
                 # When True, indexfile should be opened with checkambig=True at writing,
                 # to avoid file stat ambiguity.
                 check_ambig = attr.ib(default=False)
                 # If true, use mmap instead of reading to deal with a large index
                 mmap_large_index = attr.ib(default=False)
                 # how much data counts as "large"
                 mmap_index_threshold = attr.ib(default=None)
                 # How much data to read and cache into the raw revlog data cache.
                 chunk_cache_size = attr.ib(default=65536)
                 # The size of the uncompressed cache compared to the largest revision seen.
                 uncompressed_cache_factor = attr.ib(default=None)
                 # The number of chunks cached
                 uncompressed_cache_count = attr.ib(default=None)
                 # Allow sparse reading of the revlog data
                 with_sparse_read = attr.ib(default=False)
                 # minimal density of a sparse read chunk
                 sr_density_threshold = attr.ib(default=0.50)
                 # minimal size of data we skip when performing sparse read
                 sr_min_gap_size = attr.ib(default=262144)
                 # whether deltas are encoded against arbitrary bases
                 generaldelta = attr.ib(default=False)
             @attr.s()
             class DeltaConfig(_Config):
                 """Hold configuration values about how new deltas are computed

                 Some attributes are duplicated from DataConfig to help keep each
                 object self-contained.
                 """
                 # whether deltas can be encoded against arbitrary bases
                 general_delta = attr.ib(default=False)
                 # Allow sparse writing of the revlog data
                 sparse_revlog = attr.ib(default=False)
                 # maximum length of a delta chain
                 max_chain_len = attr.ib(default=None)
                 # Maximum distance between delta chain base start and end
                 max_deltachain_span = attr.ib(default=-1)
                 # If `upper_bound_comp` is not None, this is the expected maximal gain from
                 # compression for the data content.
                 upper_bound_comp = attr.ib(default=None)
                 # Should we try a delta against both parents
                 delta_both_parents = attr.ib(default=True)
                 # Test delta base candidate groups in chunks of this maximal size.
                 candidate_group_chunk_size = attr.ib(default=0)
                 # Should we display debug information about delta computation
                 debug_delta = attr.ib(default=False)
                 # trust incoming deltas by default
                 lazy_delta = attr.ib(default=True)
                 # trust the base of incoming deltas by default
                 lazy_delta_base = attr.ib(default=False)
             class _InnerRevlog:
                 """An inner layer of the revlog object
                 That layer exist to be able to delegate some operation to Rust, its
                 boundaries are arbitrary and based on what we can delegate to Rust.
                 """
                 def __init__(
                     self,
                     opener,
                     index,
                     index_file,
                     data_file,
                     sidedata_file,
                     inline,
                     data_config,
                     delta_config,
                     feature_config,
                     chunk_cache,
                     default_compression_header,
                 ):
                     """Store the given collaborators and set up the read caches.

                     The arguments are kept as attributes of the same name
                     (``default_compression_header`` as a private attribute).
                     ``chunk_cache`` is only handed to the random-access file
                     created for the revision data; the one for sidedata is
                     created without an initial cache.
                     """
                     self.opener = opener
                     self.index = index
                     self.index_file = index_file
                     self.data_file = data_file
                     self.sidedata_file = sidedata_file
                     self.inline = inline
                     self.data_config = data_config
                     self.delta_config = delta_config
                     self.feature_config = feature_config
                     # used during diverted write.
                     self._orig_index_file = None
                     self._default_compression_header = default_compression_header
                     # 3-tuple of file handles being used for active writing.
                     self._writinghandles = None
                     # When the revlog is inline, revision data is read from the
                     # index file; otherwise from the separate data file.
                     self._segmentfile = randomaccessfile.randomaccessfile(
                         self.opener,
                         (self.index_file if self.inline else self.data_file),
                         self.data_config.chunk_cache_size,
                         chunk_cache,
                     )
                     self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
                         self.opener,
                         self.sidedata_file,
                         self.data_config.chunk_cache_size,
                     )
                     # revlog header -> revlog compressor
                     self._decompressors = {}
                     # 3-tuple of (node, rev, text) for a raw revision.
                     self._revisioncache = None
                     # cache some uncompressed chunks
                     # rev → uncompressed_chunk
                     #
                     # the max cost is dynamically updated to be proportional to the
                     # size of the revisions we actually encounter.
                     self._uncompressed_chunk_cache = None
                     if self.data_config.uncompressed_cache_factor is not None:
                         self._uncompressed_chunk_cache = util.lrucachedict(
                             self.data_config.uncompressed_cache_count,
                             maxcost=65536,  # some arbitrary initial value
                         )
                     # ``is_delaying`` reports True while this is not None
                     self._delay_buffer = None
                 def __len__(self):
                     return len(self.index)
                 def clear_cache(self):
                     assert not self.is_delaying
                     self._revisioncache = None
                     if self._uncompressed_chunk_cache is not None:
                         self._uncompressed_chunk_cache.clear()
                     self._segmentfile.clear_cache()
                     self._segmentfile_sidedata.clear_cache()
                 @property
                 def canonical_index_file(self):
                     if self._orig_index_file is not None:
                         return self._orig_index_file
                     return self.index_file
                 @property
                 def is_delaying(self):
                     """is the revlog is currently delaying the visibility of written data?
                     The delaying mechanism can be either in-memory or written on disk in a
                     side-file."""
                     return (self._delay_buffer is not None) or (
                         self._orig_index_file is not None
                     )
                 # Derived from index values.
                 def start(self, rev):
                     """the offset of the data chunk for this revision"""
                     return int(self.index[rev][0] >> 16)
                 def length(self, rev):
                     """the length of the data chunk for this revision"""
                     return self.index[rev][1]
                 def end(self, rev):
                     """the end of the data chunk for this revision"""
                     return self.start(rev) + self.length(rev)
                 def deltaparent(self, rev):
                     """return deltaparent of the given revision"""
                     base = self.index[rev][3]
                     if base == rev:
                         return nullrev
                     elif self.delta_config.general_delta:
                         return base
                     else:
                         return rev - 1
                 def issnapshot(self, rev):
                     """tells whether rev is a snapshot"""
                     if not self.delta_config.sparse_revlog:
                         return self.deltaparent(rev) == nullrev
                     elif hasattr(self.index, 'issnapshot'):
                         # directly assign the method to cache the testing and access
                         self.issnapshot = self.index.issnapshot
                         return self.issnapshot(rev)
                     if rev == nullrev:
                         return True
                     entry = self.index[rev]
                     base = entry[3]
                     if base == rev:
                         return True
                     if base == nullrev:
                         return True
                     p1 = entry[5]
                     while self.length(p1) == 0:
                         b = self.deltaparent(p1)
                         if b == p1:
                             break
                         p1 = b
                     p2 = entry[6]
                     while self.length(p2) == 0:
                         b = self.deltaparent(p2)
                         if b == p2:
                             break
                         p2 = b
                     if base == p1 or base == p2:
                         return False
                     return self.issnapshot(base)
                 def _deltachain(self, rev, stoprev=None):
                     """Obtain the delta chain for a revision.
                     ``stoprev`` specifies a revision to stop at. If not specified, we
                     stop at the base of the chain.
                     Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
                     revs in ascending order and ``stopped`` is a bool indicating whether
                     ``stoprev`` was hit.
                     """
                     generaldelta = self.delta_config.general_delta
                     # Try C implementation.
                     try:
                         return self.index.deltachain(rev, stoprev, generaldelta)
                     except AttributeError:
                         pass
                     chain = []
                     # Alias to prevent attribute lookup in tight loop.
                     index = self.index
                     iterrev = rev
                     e = index[iterrev]
                     while iterrev != e[3] and iterrev != stoprev:
                         chain.append(iterrev)
                         if generaldelta:
                             iterrev = e[3]
                         else:
                             iterrev -= 1
                         e = index[iterrev]
                     if iterrev == stoprev:
                         stopped = True
                     else:
                         chain.append(iterrev)
                         stopped = False
                     chain.reverse()
                     return chain, stopped
                 @util.propertycache
                 def _compressor(self):
                     """Revlog compressor of the configured compression engine,
                     created with the configured engine options."""
                     features = self.feature_config
                     engine = util.compengines[features.compression_engine]
                     options = features.compression_engine_options
                     return engine.revlogcompressor(options)
                 @util.propertycache
                 def _decompressor(self):
                     """the default decompressor

                     ``None`` when there is no default compression header,
                     otherwise the ``decompress`` method of the compressor
                     matching that header.
                     """
                     if self._default_compression_header is None:
                         return None
                     header = self._default_compression_header
                     return self._get_decompressor(header).decompress
                 def _get_decompressor(self, t):
                     try:
                         compressor = self._decompressors[t]
                     except KeyError:
                         try:
                             engine = util.compengines.forrevlogheader(t)
                             compressor = engine.revlogcompressor(
                                 self.feature_config.compression_engine_options
                             )
                             self._decompressors[t] = compressor
                         except KeyError:
                             raise error.RevlogError(
                                 _(b'unknown compression type %s') % binascii.hexlify(t)
                             )
                     return compressor
                 def compress(self, data):
                     """Generate a possibly-compressed representation of data."""
                     if not data:
                         return b'', data
                     compressed = self._compressor.compress(data)
                     if compressed:
                         # The revlog compressor added the header in the returned data.
                         return b'', compressed
                     if data[0:1] == b'\0':
                         return b'', data
                     return b'u', data
                 def decompress(self, data):
                     """Decompress a revlog chunk.

                     The chunk is expected to begin with a header identifying the
                     format type so it can be routed to an appropriate decompressor.

                     Empty data is returned as is. Raises ``error.RevlogError`` when
                     zlib fails to decompress a chunk whose header is ``b'x'``.
                     """
                     if not data:
                         return data
                     # Revlogs are read much more frequently than they are written and many
                     # chunks only take microseconds to decompress, so performance is
                     # important here.
                     #
                     # We can make a few assumptions about revlogs:
                     #
                     # 1) the majority of chunks will be compressed (as opposed to inline
                     #    raw data).
                     # 2) decompressing *any* data will likely be at least 10x slower than
                     #    returning raw inline data.
                     # 3) we want to prioritize common and officially supported compression
                     #    engines
                     #
                     # It follows that we want to optimize for the "decompress compressed
                     # data when encoded with common and officially supported compression
                     # engines" case over "raw data" and "data encoded by less common or
                     # non-official compression engines." That is why we have the inline
                     # lookup first followed by the compengines lookup.
                     #
                     # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
                     # compressed chunks. And this matters for changelog and manifest reads.
                     t = data[0:1]
                     if t == b'x':
                         try:
                             return _zlibdecompress(data)
                         except zlib.error as e:
                             raise error.RevlogError(
                                 _(b'revlog decompress error: %s')
                                 % stringutil.forcebytestr(e)
                             )
                     # '\0' is more common than 'u' so it goes first.
                     elif t == b'\0':
                         # data starting with a NUL byte is returned unchanged
                         return data
                     elif t == b'u':
                         # skip the one-byte 'u' header
                         return util.buffer(data, 1)
                     # any other header: look up (or create) the matching compressor
                     compressor = self._get_decompressor(t)
                     return compressor.decompress(data)
                 @contextlib.contextmanager
                 def reading(self):
                     """Context manager keeping the data and sidedata files open for reads

                     Nothing is opened when the index is empty. Combining a delay buffer
                     with an inline revlog is rejected as a programming error.
                     """
                     if len(self.index) == 0:
                         # nothing to be read
                         yield
                         return
                     if self._delay_buffer is not None and self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)
                     # data file first, sidedata file second; released in reverse order
                     with self._segmentfile.reading(), self._segmentfile_sidedata.reading():
                         yield
                 @property
                 def is_writing(self):
                     """True if a writing context is currently open"""
                     handles = self._writinghandles
                     return handles is not None
                 @property
                 def is_open(self):
                     """True if a file handle is held on the data or sidedata file

                     Used for assert and debug in the python code.
                     """
                     data_open = self._segmentfile.is_open
                     if data_open:
                         return data_open
                     return self._segmentfile_sidedata.is_open
                 @contextlib.contextmanager
                 def writing(self, transaction, data_end=None, sidedata_end=None):
                     """Open the revlog files for writing

                     Adding content to a revlog should be done within such a context.

                     If a writing context is already open this is a no-op wrapper.
                     Otherwise the data file (non-inline revlogs only), the sidedata file
                     (when one is configured) and the index file are opened, each file is
                     registered with ``transaction.add(name, offset)``, and the handles
                     are exposed through ``self._writinghandles`` and the segment files
                     for the duration of the context. All handles are closed on exit.

                     ``data_end`` is the position the data handle is moved to; ``None``
                     means the end of the file. ``sidedata_end`` plays the same role for
                     the sidedata handle and must be provided whenever a sidedata file
                     is configured.
                     """
                     if self.is_writing:
                         yield
                     else:
                         ifh = dfh = sdfh = None
                         try:
                             r = len(self.index)
                             # opening the data file.
                             dsize = 0
                             if r:
                                 dsize = self.end(r - 1)
                             if not self.inline:
                                 try:
                                     dfh = self.opener(self.data_file, mode=b"r+")
                                     if data_end is None:
                                         dfh.seek(0, os.SEEK_END)
                                     else:
                                         dfh.seek(data_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     dfh = self.opener(self.data_file, mode=b"w+")
                                 transaction.add(self.data_file, dsize)
                             if self.sidedata_file is not None:
                                 assert sidedata_end is not None
                                 # revlog-v2 does not inline, help Pytype
                                 assert dfh is not None
                                 try:
                                     sdfh = self.opener(self.sidedata_file, mode=b"r+")
                                     # Position the *sidedata* handle. Seeking `dfh`
                                     # here would move the data handle to an offset
                                     # that belongs to another file.
                                     sdfh.seek(sidedata_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     sdfh = self.opener(self.sidedata_file, mode=b"w+")
                                 transaction.add(self.sidedata_file, sidedata_end)
                             # opening the index file.
                             isize = r * self.index.entry_size
                             ifh = self.__index_write_fp()
                             if self.inline:
                                 # inline revlogs keep index entries and data in the
                                 # same file
                                 transaction.add(self.index_file, dsize + isize)
                             else:
                                 transaction.add(self.index_file, isize)
                             # exposing all file handle for writing.
                             self._writinghandles = (ifh, dfh, sdfh)
                             self._segmentfile.writing_handle = ifh if self.inline else dfh
                             self._segmentfile_sidedata.writing_handle = sdfh
                             yield
                         finally:
                             self._writinghandles = None
                             self._segmentfile.writing_handle = None
                             self._segmentfile_sidedata.writing_handle = None
                             if dfh is not None:
                                 dfh.close()
                             if sdfh is not None:
                                 sdfh.close()
                             # closing the index file last to avoid exposing referent to
                             # potential unflushed data content.
                             if ifh is not None:
                                 ifh.close()
                 def __index_write_fp(self, index_end=None):
                     """Internal helper opening the index file for writing

                     Do not call this directly; go through the `writing` context manager
                     instead.

                     The returned handle is positioned at ``index_end``, or at the end of
                     the file when ``index_end`` is None. If the index file does not
                     exist yet it is created and returned without any seek. While a
                     delay buffer is active the handle is a ``randomaccessfile.appender``
                     fed with that buffer.
                     """
                     delayed = self._delay_buffer is not None
                     try:
                         if delayed:
                             # check_ambig affects the way a file is opened for
                             # writing. Here nothing is really opened for writing, as
                             # writes are appended to the delay buffer, so check_ambig
                             # is neither meaningful nor needed.
                             fp = randomaccessfile.appender(
                                 self.opener, self.index_file, b"r+", self._delay_buffer
                             )
                         else:
                             fp = self.opener(
                                 self.index_file,
                                 mode=b"r+",
                                 checkambig=self.data_config.check_ambig,
                             )
                         if index_end is not None:
                             fp.seek(index_end, os.SEEK_SET)
                         else:
                             fp.seek(0, os.SEEK_END)
                         return fp
                     except FileNotFoundError:
                         if delayed:
                             return randomaccessfile.appender(
                                 self.opener, self.index_file, b"w+", self._delay_buffer
                             )
                         return self.opener(
                             self.index_file,
                             mode=b"w+",
                             checkambig=self.data_config.check_ambig,
                         )
                 def __index_new_fp(self):
                     """Internal helper creating a brand new index file for writing

                     Only meant for the upgrade from an inline revlog. The file is opened
                     through the opener with ``atomictemp=True``.
                     """
                     open_options = {
                         'mode': b"w",
                         'checkambig': self.data_config.check_ambig,
                         'atomictemp': True,
                     }
                     return self.opener(self.index_file, **open_options)
                 def split_inline(self, tr, header, new_index_file_path=None):
                     """split the data of an inline revlog into an index and a data file

                     Every revision segment is copied into a freshly truncated data file,
                     then the index is rewritten (entries only, the first one prefixed
                     with the packed ``header``) and the revlog is switched to non-inline
                     mode. When ``new_index_file_path`` is given, ``self.index_file`` is
                     pointed at it before the new index is written.

                     If writing handles were open on entry, the index handle is closed
                     first and a new set of handles (index + new data file) is installed
                     before returning; otherwise the new data file handle is closed.

                     ``tr`` is not used by this method's body.

                     Returns the path of the index file now in use.
                     """
                     # Splitting while index writes are being buffered is not supported.
                     assert self._delay_buffer is None
                     existing_handles = False
                     if self._writinghandles is not None:
                         existing_handles = True
                         # In an inline revlog, slot 0 (the index handle) is the one
                         # carrying the data; make sure it hits the disk before reading.
                         fp = self._writinghandles[0]
                         fp.flush()
                         fp.close()
                         # We can't use the cached file handle after close(). So prevent
                         # its usage.
                         self._writinghandles = None
                         self._segmentfile.writing_handle = None
                         # No need to deal with sidedata writing handle as it is only
                         # relevant with revlog-v2 which is never inline, not reaching
                         # this code
                     new_dfh = self.opener(self.data_file, mode=b"w+")
                     new_dfh.truncate(0)  # drop any potentially existing data
                     try:
                         # Copy the raw segment of each revision, in order, while the
                         # revlog is still read as inline.
                         with self.reading():
                             for r in range(len(self.index)):
                                 new_dfh.write(self.get_segment_for_revs(r, r)[1])
                             new_dfh.flush()
                         if new_index_file_path is not None:
                             self.index_file = new_index_file_path
                         with self.__index_new_fp() as fp:
                             self.inline = False
                             for i in range(len(self.index)):
                                 e = self.index.entry_binary(i)
                                 if i == 0:
                                     # the format header is stored in front of the first
                                     # index entry
                                     packed_header = self.index.pack_header(header)
                                     e = packed_header + e
                                 fp.write(e)
                             # If we don't use side-write, the temp file replace the real
                             # index when we exit the context manager
                         # From now on, segments are read from the separate data file.
                         self._segmentfile = randomaccessfile.randomaccessfile(
                             self.opener,
                             self.data_file,
                             self.data_config.chunk_cache_size,
                         )
                         if existing_handles:
                             # switched from inline to conventional reopen the index
                             ifh = self.__index_write_fp()
                             self._writinghandles = (ifh, new_dfh, None)
                             self._segmentfile.writing_handle = new_dfh
                             # ownership moved to the writing handles: keep the
                             # `finally` clause from closing it
                             new_dfh = None
                             # No need to deal with sidedata writing handle as it is only
                             # relevant with revlog-v2 which is never inline, not reaching
                             # this code
                     finally:
                         if new_dfh is not None:
                             new_dfh.close()
                     return self.index_file
                 def get_segment_for_revs(self, startrev, endrev):
                     """Obtain the raw data segment covering a range of revisions.

                     ``startrev`` and ``endrev`` are the first and last revisions of the
                     range (both included). The read goes through the segment file, so
                     it may be satisfied by a cache.

                     Returns a 2-tuple of (offset, data). Offset is the integer offset
                     from the beginning of the revlog and data is the raw byte data
                     found there.

                     Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
                     to determine where each revision's data begins and ends.

                     API: we should consider making this a private part of the InnerRevlog
                     at some point.
                     """
                     # self.start() / self.end() are deliberately expanded by hand here:
                     # function calls are expensive on this path.
                     idx = self.index
                     first = idx[startrev]
                     last = first if startrev == endrev else idx[endrev]
                     begin = int(first[0] >> 16)
                     finish = int(last[0] >> 16) + last[1]
                     if self.inline:
                         # inline revlogs interleave one index entry before each chunk
                         entry_size = idx.entry_size
                         begin += (startrev + 1) * entry_size
                         finish += (endrev + 1) * entry_size
                     return begin, self._segmentfile.read_chunk(begin, finish - begin)
                 def _chunk(self, rev):
                     """Obtain a single decompressed chunk for a revision.

                     ``rev`` is an integer revision. The uncompressed chunk cache, when
                     there is one, is consulted first and fed with the result.

                     Returns the uncompressed data for the requested revision.
                     """
                     cache = self._uncompressed_chunk_cache
                     if cache is not None:
                         hit = cache.get(rev)
                         if hit is not None:
                             return hit

                     mode = self.index[rev][10]
                     raw = self.get_segment_for_revs(rev, rev)[1]
                     if mode == COMP_MODE_PLAIN:
                         text = raw
                     elif mode == COMP_MODE_DEFAULT:
                         text = self._decompressor(raw)
                     elif mode == COMP_MODE_INLINE:
                         text = self.decompress(raw)
                     else:
                         raise error.RevlogError(b'unknown compression mode %d' % mode)

                     if cache is not None:
                         cache.insert(rev, text, cost=len(text))
                     return text
                 def _chunks(self, revs, targetsize=None):
                     """Obtain decompressed chunks for the specified revisions.

                     Accepts a sequence of numeric revisions that are assumed to be in
                     ascending order. ``targetsize`` is forwarded to
                     ``deltautil.slicechunk`` when sparse reads are enabled.

                     This function is similar to calling ``self._chunk()`` multiple times,
                     but is faster: revisions missing from the uncompressed chunk cache
                     are read from disk in as few segments as possible.

                     Returns a list with decompressed data for each requested revision,
                     ordered by revision number.
                     """
                     if not revs:
                         return []
                     start = self.start
                     length = self.length
                     inline = self.inline
                     iosize = self.index.entry_size
                     buffer = util.buffer
                     fetched_revs = []
                     fadd = fetched_revs.append
                     # (rev, data) pairs, sorted by revision before returning
                     chunks = []
                     ladd = chunks.append
                     if self._uncompressed_chunk_cache is None:
                         fetched_revs = revs
                     else:
                         # serve what we can from the cache, fetch the rest
                         for rev in revs:
                             cached_value = self._uncompressed_chunk_cache.get(rev)
                             if cached_value is None:
                                 fadd(rev)
                             else:
                                 ladd((rev, cached_value))
                     if not fetched_revs:
                         slicedchunks = ()
                     elif not self.data_config.with_sparse_read:
                         slicedchunks = (fetched_revs,)
                     else:
                         slicedchunks = deltautil.slicechunk(
                             self,
                             fetched_revs,
                             targetsize=targetsize,
                         )
                     for revschunk in slicedchunks:
                         firstrev = revschunk[0]
                         # Skip trailing revisions with empty diff
                         for lastrev in revschunk[::-1]:
                             if length(lastrev) != 0:
                                 break
                         try:
                             offset, data = self.get_segment_for_revs(firstrev, lastrev)
                         except OverflowError:
                             # issue4215 - we can't cache a run of chunks greater than
                             # 2G on Windows
                             for rev in revschunk:
                                 ladd((rev, self._chunk(rev)))
                             # Every chunk of this slice has been produced one by one
                             # above. `offset` and `data` were not (re)bound for this
                             # slice, so the bulk path below must not run.
                             continue
                         decomp = self.decompress
                         # self._decompressor might be None, but will not be used in that case
                         def_decomp = self._decompressor
                         for rev in revschunk:
                             chunkstart = start(rev)
                             if inline:
                                 # account for the index entries interleaved with data
                                 chunkstart += (rev + 1) * iosize
                             chunklength = length(rev)
                             comp_mode = self.index[rev][10]
                             c = buffer(data, chunkstart - offset, chunklength)
                             if comp_mode == COMP_MODE_INLINE:
                                 c = decomp(c)
                             elif comp_mode == COMP_MODE_DEFAULT:
                                 c = def_decomp(c)
                             elif comp_mode != COMP_MODE_PLAIN:
                                 msg = b'unknown compression mode %d'
                                 msg %= comp_mode
                                 raise error.RevlogError(msg)
                             # COMP_MODE_PLAIN: the stored bytes are used as they are
                             ladd((rev, c))
                             if self._uncompressed_chunk_cache is not None:
                                 self._uncompressed_chunk_cache.insert(rev, c, len(c))
                     chunks.sort()
                     return [x[1] for x in chunks]
                 def raw_text(self, node, rev):
                     """Rebuild the rawtext of a revision, without validating it

                     The delta chain of ``rev`` is resolved, stopping early at the cached
                     revision when there is one, and the deltas are applied on top of
                     the base text.

                     Returns ``(rev, rawtext, validated)``; ``validated`` is always
                     False here.
                     """
                     # The cache entry looks like (node, rev, rawtext); its revision may
                     # serve as a starting point for applying deltas.
                     stop_at = self._revisioncache[1] if self._revisioncache else None
                     chain, stopped = self._deltachain(rev, stoprev=stop_at)
                     # intermediate text the deltas get applied to
                     basetext = self._revisioncache[2] if stopped else None

                     # drop cache to save memory, the caller is expected to
                     # update self._inner._revisioncache after validating the text
                     self._revisioncache = None

                     rawsize = self.index[rev][2]
                     targetsize = 4 * rawsize if 0 <= rawsize else None

                     chunk_cache = self._uncompressed_chunk_cache
                     if chunk_cache is not None:
                         # dynamically grow the uncompressed chunk cache to fit the
                         # largest revision seen so far in this revlog.
                         wanted = rawsize * self.data_config.uncompressed_cache_factor
                         if wanted > chunk_cache.maxcost:
                             chunk_cache.maxcost = wanted

                     deltas = self._chunks(chain, targetsize=targetsize)
                     if basetext is None:
                         # no cached text: the first chunk of the chain is the base
                         basetext = bytes(deltas[0])
                         deltas = deltas[1:]
                     rawtext = mdiff.patches(basetext, deltas)
                     del basetext  # let us have a chance to free memory early
                     return (rev, rawtext, False)
                 def sidedata(self, rev, sidedata_end):
                     """Return the sidedata for a given revision number.

                     An empty dict is returned when the index records no sidedata for
                     ``rev``. A RevlogError is raised when the recorded segment extends
                     past ``sidedata_end`` or uses an unknown compression mode.
                     """
                     entry = self.index[rev]
                     size = entry[9]
                     if size == 0:
                         return {}

                     offset = entry[8]
                     if self.inline:
                         offset += self.index.entry_size * (1 + rev)
                     if sidedata_end < offset + size:
                         details = (self.sidedata_file, size, offset, sidedata_end)
                         raise error.RevlogError(FILE_TOO_SHORT_MSG % details)

                     stored = self._segmentfile_sidedata.read_chunk(offset, size)
                     mode = entry[11]
                     if mode == COMP_MODE_PLAIN:
                         segment = stored
                     elif mode == COMP_MODE_DEFAULT:
                         segment = self._decompressor(stored)
                     elif mode == COMP_MODE_INLINE:
                         segment = self.decompress(stored)
                     else:
                         raise error.RevlogError(b'unknown compression mode %d' % mode)
                     return sidedatautil.deserialize_sidedata(segment)
                 def write_entry(
                     self,
                     transaction,
                     entry,
                     data,
                     link,
                     offset,
                     sidedata,
                     sidedata_offset,
                     index_end,
                     data_end,
                     sidedata_end,
                 ):
                     """Write one revision through the currently open writing handles

                     ``entry`` is the binary index entry and ``data`` a two-item sequence
                     written back to back (the first item is skipped when empty on
                     non-inline revlogs). ``index_end`` / ``data_end`` / ``sidedata_end``
                     are the positions the handles are moved to before writing; ``None``
                     means "end of file" for the index and data handles.

                     Returns the ``(index, data, sidedata)`` handle positions after the
                     write, with ``None`` for handles that are not open.
                     """
                     handles = self._writinghandles
                     if handles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     index_fp, data_fp, side_fp = handles

                     # Files opened in a+ mode have inconsistent behavior on various
                     # platforms. Windows requires that a file positioning call be made
                     # when the file handle transitions between reads and writes. See
                     # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
                     # platforms, Python or the platform itself can be buggy. Some versions
                     # of Solaris have been observed to not append at the end of the file
                     # if the file was seeked to before the end. See issue4943 for more.
                     #
                     # We work around this issue by inserting a seek() before writing.
                     # Note: This is likely not necessary on Python 3. However, because
                     # the file handle is reused for reads and may be seeked there, we need
                     # to be careful before changing this.
                     if index_end is not None:
                         index_fp.seek(index_end, os.SEEK_SET)
                     else:
                         index_fp.seek(0, os.SEEK_END)
                     if data_fp:
                         if data_end is not None:
                             data_fp.seek(data_end, os.SEEK_SET)
                         else:
                             data_fp.seek(0, os.SEEK_END)
                     if side_fp:
                         side_fp.seek(sidedata_end, os.SEEK_SET)

                     last_rev = len(self.index) - 1
                     if self.inline:
                         if self._delay_buffer is not None:
                             msg = b'invalid delayed write on inline revlog'
                             raise error.ProgrammingError(msg)
                         # entry and data live side by side in the index file
                         offset += last_rev * self.index.entry_size
                         transaction.add(self.canonical_index_file, offset)
                         assert not sidedata
                         for piece in (entry, data[0], data[1]):
                             index_fp.write(piece)
                     else:
                         transaction.add(self.data_file, offset)
                         if self.sidedata_file:
                             transaction.add(self.sidedata_file, sidedata_offset)
                         transaction.add(self.canonical_index_file, last_rev * len(entry))
                         if data[0]:
                             data_fp.write(data[0])
                         data_fp.write(data[1])
                         if sidedata:
                             side_fp.write(sidedata)
                         if self._delay_buffer is None:
                             index_fp.write(entry)
                         else:
                             # index writes are being held back: buffer the entry
                             self._delay_buffer.append(entry)
                     return (
                         index_fp.tell(),
                         data_fp.tell() if data_fp else None,
                         side_fp.tell() if side_fp else None,
                     )
                 def _divert_index(self):
                     return self.index_file + b'.a'
                 def delay(self):
                     """Start keeping index writes away from the real index file

                     Nothing happens if a delay buffer or a diverted index is already in
                     place. An empty revlog gets its index diverted to the ``.a`` file
                     (any stale one is removed) and that path is returned. Otherwise an
                     in-memory delay buffer is set up and None is returned.
                     """
                     assert not self.is_open
                     if self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)

                     already_set_up = (
                         self._delay_buffer is not None
                         or self._orig_index_file is not None
                     )
                     if already_set_up:
                         # delay or divert already in place
                         return None

                     if len(self.index) != 0:
                         self._delay_buffer = []
                         return None

                     self._orig_index_file = self.index_file
                     self.index_file = self._divert_index()
                     assert self._orig_index_file is not None
                     assert self.index_file is not None
                     vfs = self.opener
                     if vfs.exists(self.index_file):
                         vfs.unlink(self.index_file)
                     return self.index_file
                 def write_pending(self):
                     """Materialize the pending index content in the ``.a`` file

                     When the index is already diverted, ``(None, True)`` is returned
                     right away. Otherwise the index file is copied to the ``.a`` file,
                     the buffered entries (if any) are appended to that copy, the delay
                     buffer is dropped and the revlog is pointed at the copy.

                     Returns ``(index_file, any_pending)``.
                     """
                     assert not self.is_open
                     if self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)
                     if self._orig_index_file is not None:
                         return None, True

                     vfs = self.opener
                     pending_index_file = self._divert_index()
                     if vfs.exists(pending_index_file):
                         vfs.unlink(pending_index_file)
                     util.copyfile(
                         vfs.join(self.index_file),
                         vfs.join(pending_index_file),
                     )

                     buffered = self._delay_buffer
                     any_pending = bool(buffered)
                     if any_pending:
                         with vfs(pending_index_file, b'r+') as ifh:
                             ifh.seek(0, os.SEEK_END)
                             ifh.write(b"".join(buffered))

                     self._delay_buffer = None
                     self._orig_index_file = self.index_file
                     self.index_file = pending_index_file
                     return self.index_file, any_pending
                 def finalize_pending(self):
                     """Make the delayed or diverted index content final

                     With a delay buffer, the buffered entries are appended to the index
                     file and the buffer is dropped. With a diverted index, the diverted
                     file (if it exists) is renamed over the original one and the revlog
                     is pointed back at the original. Having neither is a programming
                     error.

                     Returns ``self.canonical_index_file``.
                     """
                     assert not self.is_open
                     if self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)

                     buffered = self._delay_buffer
                     delayed = buffered is not None
                     diverted = self._orig_index_file is not None
                     if delayed and diverted:
                         assert False, "unreachable"
                     elif diverted:
                         if self.opener.exists(self.index_file):
                             self.opener.rename(
                                 self.index_file,
                                 self._orig_index_file,
                                 checkambig=True,
                             )
                         self.index_file = self._orig_index_file
                         self._orig_index_file = None
                     elif delayed:
                         if buffered:
                             with self.opener(self.index_file, b'r+') as ifh:
                                 ifh.seek(0, os.SEEK_END)
                                 ifh.write(b"".join(buffered))
                         self._delay_buffer = None
                     else:
                         msg = b"not delay or divert found on this revlog"
                         raise error.ProgrammingError(msg)
                     return self.canonical_index_file
             class revlog:
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, including its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 If checkambig, indexfile is opened with checkambig=True at
                 writing, to avoid file stat ambiguity.
                 If mmaplargeindex is True, and an mmapindexthreshold is set, the
                 index will be mmapped rather than read if it is larger than the
                 configured threshold.
                 If censorable is True, the revlog can have censored revisions.
                 If `upperboundcomp` is not None, this is the expected maximal gain from
                 compression for the data content.
                 `concurrencychecker` is an optional function that receives 3 arguments: a
                 file handle, a filename, and an expected position. It should check whether
                 the current position in the file handle is valid, and log/warn/fail (by
                 raising).
                     See mercurial/revlogutils/constants.py for details about the content of an
                 index entry.
                 """
                 _flagserrorclass = error.RevlogError
                 @staticmethod
                 def is_inline_index(header_bytes):
                     """Determine if a revlog is inline from the initial bytes of the index"""
                     if len(header_bytes) == 0:
                         return True
                     header = INDEX_HEADER.unpack(header_bytes)[0]
                     _format_flags = header & ~0xFFFF
                     _format_version = header & 0xFFFF
                     features = FEATURES_BY_VERSION[_format_version]
                     return features[b'inline'](_format_flags)
                 def __init__(
                     self,
                     opener,
                     target,
                     radix,
                     postfix=None,  # only exist for `tmpcensored` now
                     checkambig=False,
                     mmaplargeindex=False,
                     censorable=False,
                     upperboundcomp=None,
                     persistentnodemap=False,
                     concurrencychecker=None,
                     trypending=False,
                     try_split=False,
                     canonical_parent_order=True,
                     data_config=None,
                     delta_config=None,
                     feature_config=None,
                     may_inline=True,  # may inline new revlog
                 ):
                     """
                     Build a revlog object and load its index.

                     `opener` abstracts the file opening operation (it can be used to
                     implement COW semantics or the like); its `options` mapping is
                     consulted for default configuration objects.

                     `target` is a (KIND, ID) tuple identifying the content stored in
                     this revlog, so that other code does not need heuristics or index
                     filename analysis. Normal code must set it reliably; test, debug
                     or performance measurement code might not set an accurate value.

                     Each of `feature_config`, `data_config` and `delta_config` is
                     copied when given; otherwise a copy of the matching opener option
                     is used, and failing that a fresh default object is created.
                     """
                     # File names; the real values are computed while loading the index.
                     self.radix = radix
                     self._docket_file = None
                     self._indexfile = None
                     self._datafile = None
                     self._sidedatafile = None
                     self._nodemap_file = None
                     self.postfix = postfix
                     self._trypending = trypending
                     self._try_split = try_split
                     self._may_inline = may_inline
                     self.opener = opener
                     if persistentnodemap:
                         self._nodemap_file = nodemaputil.get_nodemap_file(self)
                     assert target[0] in ALL_KINDS
                     assert len(target) == 2
                     self.target = target

                     def pick_config(explicit, option_key, factory):
                         # explicit argument > opener option > fresh default
                         if explicit is not None:
                             return explicit.copy()
                         if option_key in self.opener.options:
                             return self.opener.options[option_key].copy()
                         return factory()

                     features = pick_config(
                         feature_config, b'feature-config', FeatureConfig
                     )
                     self.feature_config = features
                     features.censorable = censorable
                     features.canonical_parent_order = canonical_parent_order
                     data = pick_config(data_config, b'data-config', DataConfig)
                     self.data_config = data
                     data.check_ambig = checkambig
                     data.mmap_large_index = mmaplargeindex
                     delta = pick_config(delta_config, b'delta-config', DeltaConfig)
                     self.delta_config = delta
                     delta.upper_bound_comp = upperboundcomp
                     # rev -> chain base rev
                     self._chainbasecache = util.lrucachedict(100)
                     self.index = None
                     self._docket = None
                     self._nodemap_docket = None
                     # partial identifier -> full node
                     self._pcache = {}
                     # Per-instance copy of the flag processors, so that each revlog
                     # can register custom flags without affecting the others.
                     self._flagprocessors = dict(flagutil.flagprocessors)
                     # guards against nested addgroup calls
                     self._adding_group = None
                     self._load_inner(self._loadindex())
                     self._concurrencychecker = concurrencychecker
                 def _init_opts(self):
                     """Derive the default revlog mode from the opener options and configs.

                     The on-disk content may later override these defaults. Besides
                     returning values, this registers the ellipsis and option-provided
                     flag processors on the instance and validates the chunk cache size
                     (it must be a strictly positive power of two, otherwise
                     error.RevlogError is raised).

                     Returns a `(new_header, mmapindexthreshold, force_nodemap)` tuple
                     for use in _loadindex():

                     * new_header:
                         version header to use if a new revlog has to be created
                     * mmapindexthreshold:
                         minimal index size from which mmap is used, or None
                     * force_nodemap:
                         force the usage of a "development" version of the nodemap code
                     """
                     opts = self.opener.options
                     if b'changelogv2' in opts and self.revlog_kind == KIND_CHANGELOG:
                         new_header = CHANGELOGV2
                         self.feature_config.compute_rank = opts.get(
                             b'changelogv2.compute-rank', True
                         )
                     elif b'revlogv2' in opts:
                         new_header = REVLOGV2
                     elif b'revlogv1' in opts:
                         new_header = REVLOGV1
                         if self._may_inline:
                             new_header |= FLAG_INLINE_DATA
                         if b'generaldelta' in opts:
                             new_header |= FLAG_GENERALDELTA
                     elif b'revlogv0' in opts:
                         new_header = REVLOGV0
                     else:
                         new_header = REVLOG_DEFAULT_VERSION
                     data_config = self.data_config
                     mmapindexthreshold = (
                         data_config.mmap_index_threshold
                         if data_config.mmap_large_index
                         else None
                     )
                     if self.feature_config.enable_ellipsis:
                         self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor
                     # revlog v0 doesn't have flag processors
                     extra_processors = opts.get(b'flagprocessors', {})
                     for flag, processor in extra_processors.items():
                         flagutil.insertflagprocessor(flag, processor, self._flagprocessors)
                     cache_size = data_config.chunk_cache_size
                     if cache_size <= 0:
                         msg = _(b'revlog chunk cache size %r is not greater than 0')
                         raise error.RevlogError(msg % cache_size)
                     if cache_size & (cache_size - 1):
                         # more than one bit set: not a power of two
                         msg = _(b'revlog chunk cache size %r is not a power of 2')
                         raise error.RevlogError(msg % cache_size)
                     force_nodemap = opts.get(b'devel-force-nodemap', False)
                     return new_header, mmapindexthreshold, force_nodemap
                 def _get_data(self, filepath, mmap_threshold, size=None):
                     """return a file content with or without mmap
                     If the file is missing return the empty string"""
                     try:
                         with self.opener(filepath) as fp:
                             if mmap_threshold is not None:
                                 file_size = self.opener.fstat(fp).st_size
                                 if file_size >= mmap_threshold:
                                     if size is not None:
                                         # avoid potentiel mmap crash
                                         size = min(file_size, size)
                                     # TODO: should .close() to release resources without
                                     # relying on Python GC
                                     if size is None:
                                         return util.buffer(util.mmapread(fp))
                                     else:
                                         return util.buffer(util.mmapread(fp, size))
                             if size is None:
                                 return fp.read()
                             else:
                                 return fp.read(size)
                     except FileNotFoundError:
                         return b''
                 def get_streams(self, max_linkrev, force_inline=False):
                     """return a list of streams that represent this revlog
                     This is used by stream-clone to do bytes to bytes copies of a repository.
                     This streams data for all revisions that refer to a changelog revision up
                     to `max_linkrev`.
                     If `force_inline` is set, it enforces that the stream will represent an inline revlog.
                     It returns is a list of three-tuple:
                         [
                             (filename, bytes_stream, stream_size),
                             …
                         ]
                     """
                     n = len(self)
                     index = self.index
                     while n > 0:
                         linkrev = index[n - 1][4]
                         if linkrev < max_linkrev:
                             break
                         # note: this loop will rarely go through multiple iterations, since
                         # it only traverses commits created during the current streaming
                         # pull operation.
                         #
                         # If this become a problem, using a binary search should cap the
                         # runtime of this.
                         n = n - 1
                     if n == 0:
                         # no data to send
                         return []
                     index_size = n * index.entry_size
                     data_size = self.end(n - 1)
                     # XXX we might have been split (or stripped) since the object
                     # initialization, We need to close this race too, but having a way to
                     # pre-open the file we feed to the revlog and never closing them before
                     # we are done streaming.
                     if self._inline:
                         def get_stream():
                             with self.opener(self._indexfile, mode=b"r") as fp:
                                 yield None
                                 size = index_size + data_size
                                 if size <= 65536:
                                     yield fp.read(size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=size)
                         inline_stream = get_stream()
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     elif force_inline:
                         def get_stream():
                             with self.reading():
                                 yield None
                                 for rev in range(n):
                                     idx = self.index.entry_binary(rev)
                                     if rev == 0 and self._docket is None:
                                         # re-inject the inline flag
                                         header = self._format_flags
                                         header |= self._format_version
                                         header |= FLAG_INLINE_DATA
                                         header = self.index.pack_header(header)
                                         idx = header + idx
                                     yield idx
                                     yield self._inner.get_segment_for_revs(rev, rev)[1]
                         inline_stream = get_stream()
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     else:
                         def get_index_stream():
                             with self.opener(self._indexfile, mode=b"r") as fp:
                                 yield None
                                 if index_size <= 65536:
                                     yield fp.read(index_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=index_size)
                         def get_data_stream():
                             with self._datafp() as fp:
                                 yield None
                                 if data_size <= 65536:
                                     yield fp.read(data_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=data_size)
                         index_stream = get_index_stream()
                         next(index_stream)
                         data_stream = get_data_stream()
                         next(data_stream)
                         return [
                             (self._datafile, data_stream, data_size),
                             (self._indexfile, index_stream, index_size),
                         ]
                 def _loadindex(self, docket=None):
                     """Read and parse the index, returning the parser's chunk cache.

                     The entry point file is chosen from the postfix, pending (`.i.a`)
                     or split index when applicable, defaulting to `<radix>.i`. When no
                     `docket` is passed, the header found there (or the default header
                     for an empty revlog) determines the format version and flags, and
                     from them whether the revlog is inline, uses general delta, has
                     sidedata and relies on a docket.

                     When `docket` is passed it is used as-is and the entry point is
                     recorded as the docket file; the format version and flags are not
                     recomputed in that case.

                     On success `self.index` is set and the chain info cache is reset.

                     Raises error.RevlogError for an unknown version, unknown flags, a
                     docket-referenced index that is shorter than expected, or an index
                     the parser rejects as corrupted.
                     """
                     new_header, mmapindexthreshold, force_nodemap = self._init_opts()
                     if self.postfix is not None:
                         entry_point = b'%s.i.%s' % (self.radix, self.postfix)
                     elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
                         entry_point = b'%s.i.a' % self.radix
                     elif self._try_split and self.opener.exists(self._split_index_file):
                         entry_point = self._split_index_file
                     else:
                         entry_point = b'%s.i' % self.radix
                     if docket is not None:
                         self._docket = docket
                         self._docket_file = entry_point
                     else:
                         self._initempty = True
                         entry_data = self._get_data(entry_point, mmapindexthreshold)
                         if len(entry_data) > 0:
                             header = INDEX_HEADER.unpack(entry_data[:4])[0]
                             self._initempty = False
                         else:
                             header = new_header
                         # low 16 bits: format version, remaining bits: format flags
                         self._format_flags = header & ~0xFFFF
                         self._format_version = header & 0xFFFF
                         supported_flags = SUPPORTED_FLAGS.get(self._format_version)
                         if supported_flags is None:
                             msg = _(b'unknown version (%d) in revlog %s')
                             msg %= (self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         elif self._format_flags & ~supported_flags:
                             msg = _(b'unknown flags (%#04x) in version %d revlog %s')
                             display_flag = self._format_flags >> 16
                             msg %= (display_flag, self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         features = FEATURES_BY_VERSION[self._format_version]
                         self._inline = features[b'inline'](self._format_flags)
                         self.delta_config.general_delta = features[b'generaldelta'](
                             self._format_flags
                         )
                         self.feature_config.has_side_data = features[b'sidedata']
                         if not features[b'docket']:
                             # the entry point is the index itself
                             self._indexfile = entry_point
                             index_data = entry_data
                         else:
                             # the entry point is a docket pointing at the real files
                             self._docket_file = entry_point
                             if self._initempty:
                                 self._docket = docketutil.default_docket(self, header)
                             else:
                                 self._docket = docketutil.parse_docket(
                                     self, entry_data, use_pending=self._trypending
                                 )
                     if self._docket is not None:
                         self._indexfile = self._docket.index_filepath()
                         index_data = b''
                         index_size = self._docket.index_end
                         if index_size > 0:
                             index_data = self._get_data(
                                 self._indexfile, mmapindexthreshold, size=index_size
                             )
                             if len(index_data) < index_size:
                                 msg = _(b'too few index data for %s: got %d, expected %d')
                                 msg %= (self.display_id, len(index_data), index_size)
                                 raise error.RevlogError(msg)
                         self._inline = False
                         # generaldelta implied by version 2 revlogs.
                         self.delta_config.general_delta = True
                         # the logic for persistent nodemap will be dealt with within the
                         # main docket, so disable it for now.
                         self._nodemap_file = None
                     if self._docket is not None:
                         self._datafile = self._docket.data_filepath()
                         self._sidedatafile = self._docket.sidedata_filepath()
                     elif self.postfix is None:
                         self._datafile = b'%s.d' % self.radix
                     else:
                         self._datafile = b'%s.d.%s' % (self.radix, self.postfix)
                     self.nodeconstants = sha1nodeconstants
                     self.nullid = self.nodeconstants.nullid
                     # sparse-revlog can't be on without general-delta (issue6056)
                     if not self.delta_config.general_delta:
                         self.delta_config.sparse_revlog = False
                     self._storedeltachains = True
                     devel_nodemap = (
                         self._nodemap_file
                         and force_nodemap
                         and parse_index_v1_nodemap is not None
                     )
                     # Using the CIndex is no longer possible, as the
                     # `AncestorsIterator` and `LazyAncestors` classes now require
                     # a Rust index for instantiation. So the Rust index is used
                     # whenever the Rust revlog module is available, with or without
                     # a persistent nodemap.
                     use_rust_index = rustrevlog is not None
                     self._parse_index = parse_index_v1
                     if self._format_version == REVLOGV0:
                         self._parse_index = revlogv0.parse_index_v0
                     elif self._format_version == REVLOGV2:
                         self._parse_index = parse_index_v2
                     elif self._format_version == CHANGELOGV2:
                         self._parse_index = parse_index_cl_v2
                     elif devel_nodemap:
                         self._parse_index = parse_index_v1_nodemap
                     elif use_rust_index:
                         self._parse_index = functools.partial(
                             parse_index_v1_rust, default_header=new_header
                         )
                     try:
                         d = self._parse_index(index_data, self._inline)
                         index, chunkcache = d
                         use_nodemap = (
                             not self._inline
                             and self._nodemap_file is not None
                             and hasattr(index, 'update_nodemap_data')
                         )
                         if use_nodemap:
                             nodemap_data = nodemaputil.persisted_data(self)
                             if nodemap_data is not None:
                                 docket = nodemap_data[0]
                                 # only trust the persisted nodemap if its recorded
                                 # tip still matches the index content
                                 if (
                                     len(d[0]) > docket.tip_rev
                                     and d[0][docket.tip_rev][7] == docket.tip_node
                                 ):
                                     # no changelog tampering
                                     self._nodemap_docket = docket
                                     index.update_nodemap_data(*nodemap_data)
                     except (ValueError, IndexError):
                         raise error.RevlogError(
                             _(b"index %s is corrupted") % self.display_id
                         )
                     self.index = index
                     # revnum -> (chain-length, sum-delta-length)
                     self._chaininfocache = util.lrucachedict(500)
                     return chunkcache
                 def _load_inner(self, chunk_cache):
                     """Create `self._inner` from the state computed while loading the index.

                     The default compression header comes from the docket when there is
                     one, and is None otherwise.
                     """
                     docket = self._docket
                     compression_header = (
                         None if docket is None else docket.default_compression_header
                     )
                     self._inner = _InnerRevlog(
                         opener=self.opener,
                         index=self.index,
                         index_file=self._indexfile,
                         data_file=self._datafile,
                         sidedata_file=self._sidedatafile,
                         inline=self._inline,
                         data_config=self.data_config,
                         delta_config=self.delta_config,
                         feature_config=self.feature_config,
                         chunk_cache=chunk_cache,
                         default_compression_header=compression_header,
                     )
                 def get_revlog(self):
                     """simple function to mirror API of other not-really-revlog API"""
                     return self
                 @util.propertycache
                 def revlog_kind(self):
                     """The KIND part (first item) of this revlog's `target`."""
                     kind = self.target[0]
                     return kind
                 @util.propertycache
                 def display_id(self):
                     """The public facing "ID" of the revlog, as used in messages.

                     For filelogs this is the second item of `target`; for every other
                     kind it is the radix.
                     """
                     if self.revlog_kind != KIND_FILELOG:
                         return self.radix
                     # Reference the file without the "data/" prefix, so it is familiar
                     # to the user.
                     return self.target[1]
                 def _datafp(self, mode=b'r'):
                     """file object for the revlog's data file"""
                     return self.opener(self._datafile, mode=mode)
                 def tiprev(self):
                     return len(self.index) - 1
                 def tip(self):
                     return self.node(self.tiprev())
                 def __contains__(self, rev):
                     return 0 <= rev < len(self)
                 def __len__(self):
                     return len(self.index)
                 def __iter__(self):
                     return iter(range(len(self)))
                 def revs(self, start=0, stop=None):
                     """Iterate over the revisions of this revlog, from `start` to `stop`.

                     The iteration itself is delegated to storageutil.iterrevs()."""
                     total = len(self)
                     return storageutil.iterrevs(total, start=start, stop=stop)
                 def hasnode(self, node):
                     try:
                         self.rev(node)
                         return True
                     except KeyError:
                         return False
                 def _candelta(self, baserev, rev):
                     """Tell whether a delta between `baserev` and `rev` is allowed.

                     Deltas are refused as soon as either revision carries a flag whose
                     processor changes the rawtext (ex. LFS): such a processor can alter
                     the rawtext the delta would be based on, and two clients could hold
                     the same node with different flags (i.e. different rawtext
                     contents), making the delta incompatible.
                     """
                     if self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
                         return False
                     if self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
                         return False
                     return True
                 def update_caches(self, transaction):
                     """update on disk cache
                     If a transaction is passed, the update may be delayed to transaction
                     commit."""
                     if self._nodemap_file is not None:
                         if transaction is None:
                             nodemaputil.update_persistent_nodemap(self)
                         else:
                             nodemaputil.setup_persistent_nodemap(transaction, self)
                 def clearcaches(self):
                     """Clear in-memory caches"""
                     self._chainbasecache.clear()
                     self._inner.clear_cache()
                     self._pcache = {}
                     self._nodemap_docket = None
                     self.index.clearcaches()
                     # The python code is the one responsible for validating the docket, we
                     # end up having to refresh it here.
                     use_nodemap = (
                         not self._inline
                         and self._nodemap_file is not None
                         and hasattr(self.index, 'update_nodemap_data')
                     )
                     if use_nodemap:
                         nodemap_data = nodemaputil.persisted_data(self)
                         if nodemap_data is not None:
                             self._nodemap_docket = nodemap_data[0]
                             self.index.update_nodemap_data(*nodemap_data)
                 def rev(self, node):
                     """return the revision number associated with a <nodeid>"""
                     try:
                         return self.index.rev(node)
                     except TypeError:
                         raise
                     except error.RevlogError:
                         # parsers.c radix tree lookup failed
                         if (
                             node == self.nodeconstants.wdirid
                             or node in self.nodeconstants.wdirfilenodeids
                         ):
                             raise error.WdirUnsupported
                         raise error.LookupError(node, self.display_id, _(b'no node'))
                 # Accessors for index entries.
                 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
                 # are flags.
                 def start(self, rev):
                     return int(self.index[rev][0] >> 16)
                 def sidedata_cut_off(self, rev):
                     sd_cut_off = self.index[rev][8]
                     if sd_cut_off != 0:
                         return sd_cut_off
                     # This is some annoying dance, because entries without sidedata
                     # currently use 0 as their ofsset. (instead of previous-offset +
                     # previous-size)
                     #
                     # We should reconsider this sidedata → 0 sidata_offset policy.
                     # In the meantime, we need this.
                     while 0 <= rev:
                         e = self.index[rev]
                         if e[9] != 0:
                             return e[8] + e[9]
                         rev -= 1
                     return 0
                 def flags(self, rev):
                     return self.index[rev][0] & 0xFFFF
                 def length(self, rev):
                     return self.index[rev][1]
                 def sidedata_length(self, rev):
                     if not self.feature_config.has_side_data:
                         return 0
                     return self.index[rev][9]
                 def rawsize(self, rev):
                     """return the length of the uncompressed text for a given revision"""
                     l = self.index[rev][2]
                     if l >= 0:
                         return l
                     t = self.rawdata(rev)
                     return len(t)
                 def size(self, rev):
                     """Return the length of the non-raw text of `rev`.

                     The non-raw text is the one produced by the "read" flag
                     processors."""
                     # Flags whose "read" processor could change the content. ELLIPSIS
                     # is known to not change it, so it is left out.
                     content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
                     if self.flags(rev) & content_changing:
                         return len(self.revision(rev))
                     # fast path: the content cannot differ from the raw one
                     return self.rawsize(rev)
                 def fast_rank(self, rev):
                     """Return the rank of a revision if already known, or None otherwise.

                     The rank of a revision is the size of the sub-graph it defines as
                     a head. Equivalently, the rank of a revision `r` is the size of
                     the set `ancestors(r)`, `r` included.

                     This method returns the rank retrieved from the revlog in
                     constant time. It makes no attempt at computing unknown values
                     for versions of the revlog which do not persist the rank.
                     """
                     stored_rank = self.index[rev][ENTRY_RANK]
                     if self._format_version != CHANGELOGV2:
                         return None
                     if stored_rank == RANK_UNKNOWN:
                         return None
                     # by convention the null revision has rank 0
                     return 0 if rev == nullrev else stored_rank
                 def chainbase(self, rev):
                     """Return the revision at the bottom of ``rev``'s base chain.

                     Index field 3 is followed from entry to entry until an entry
                     names itself as its own base.  Results are memoized in
                     ``self._chainbasecache``.
                     """
                     cached = self._chainbasecache.get(rev)
                     if cached is not None:
                         return cached
                     index = self.index
                     current = rev
                     while True:
                         base = index[current][3]
                         if base == current:
                             break
                         current = base
                     self._chainbasecache[rev] = base
                     return base
                 def linkrev(self, rev):
                     """Return the link revision (index field 4) of ``rev``."""
                     entry = self.index[rev]
                     return entry[4]
                 def parentrevs(self, rev):
                     """Return the pair of parent revisions of ``rev``.

                     When ``feature_config.canonical_parent_order`` is set and the
                     first parent is ``nullrev``, the two parents are swapped.

                     Raises ``error.WdirUnsupported`` when ``rev`` is ``wdirrev`` and
                     is not in the index; any other ``IndexError`` is propagated.
                     """
                     try:
                         entry = self.index[rev]
                     except IndexError:
                         if rev != wdirrev:
                             raise
                         raise error.WdirUnsupported
                     swap = (
                         self.feature_config.canonical_parent_order
                         and entry[5] == nullrev
                     )
                     if swap:
                         return entry[6], entry[5]
                     return entry[5], entry[6]
                 # Fast parentrevs(rev) for callers that know rev isn't filtered.
                 # At this level it is a plain alias of parentrevs.
                 _uncheckedparentrevs = parentrevs
                 def node(self, rev):
                     """Return the node id (index field 7) of revision ``rev``.

                     Raises ``error.WdirUnsupported`` when the lookup fails with
                     ``IndexError`` for ``wdirrev``; any other ``IndexError`` is
                     propagated unchanged.
                     """
                     try:
                         nodeid = self.index[rev][7]
                     except IndexError:
                         if rev != wdirrev:
                             raise
                         raise error.WdirUnsupported
                     return nodeid
                 # Derived from index values.
                 def end(self, rev):
                     """Return ``start(rev) + length(rev)``."""
                     begin = self.start(rev)
                     return begin + self.length(rev)
                 def parents(self, node):
                     """Return the two parent node ids of ``node`` as ``(p1, p2)``.

                     When ``feature_config.canonical_parent_order`` is set and the
                     first parent is the null node, the pair is swapped so that the
                     null parent comes second, mirroring what ``parentrevs`` does for
                     revision numbers.
                     """
                     index = self.index
                     entry = index[self.rev(node)]
                     # inline node() to avoid function call overhead
                     p1node = index[entry[5]][7]
                     p2node = index[entry[6]][7]
                     # entry[5] is a revision number (it is used to index the index
                     # above), so comparing it directly with the ``nullid`` node can
                     # never match.  Compare the resolved parent node instead.
                     if (
                         self.feature_config.canonical_parent_order
                         and p1node == self.nullid
                     ):
                         return p2node, p1node
                     return p1node, p2node
                 def chainlen(self, rev):
                     """Return the first element of ``_chaininfo(rev)``: the chain length."""
                     info = self._chaininfo(rev)
                     return info[0]
                 def _chaininfo(self, rev):
                     """Return ``(chain length, compressed chain size)`` for ``rev``.

                     The chain is walked from ``rev`` down to its base: through index
                     field 3 when ``delta_config.general_delta`` is set, through the
                     previous revision otherwise.  Index field 1 of every visited
                     entry is summed up.  Results are memoized in
                     ``self._chaininfocache`` and cached values met along the way are
                     reused.
                     """
                     cache = self._chaininfocache
                     if rev in cache:
                         return cache[rev]
                     index = self.index
                     follow_base = self.delta_config.general_delta
                     current = rev
                     entry = index[current]
                     depth = 0
                     compressed = 0
                     while True:
                         if current == entry[3]:
                             # Reached the chain base.  Add its text length since
                             # decompressing that also takes work.  (For cache hits
                             # the length is already included.)
                             compressed += entry[1]
                             break
                         depth += 1
                         compressed += entry[1]
                         current = entry[3] if follow_base else current - 1
                         if current in cache:
                             known = cache[current]
                             depth += known[0]
                             compressed += known[1]
                             break
                         entry = index[current]
                     result = (depth, compressed)
                     cache[rev] = result
                     return result
                 def _deltachain(self, rev, stoprev=None):
                     """Delegate to ``self._inner._deltachain`` with the same arguments."""
                     inner = self._inner
                     return inner._deltachain(rev, stoprev=stoprev)
                 def ancestors(self, revs, stoprev=0, inclusive=False):
                     """Generate the ancestors of 'revs' in reverse revision order.

                     Does not generate revs lower than stoprev.

                     See the documentation for ancestor.lazyancestors for more
                     details.
                     """
                     revs = list(revs)
                     # first, make sure start revisions aren't filtered
                     for start in revs:
                         self.node(start)
                     # and we're sure ancestors aren't filtered as well
                     if rustancestor is None or not self.index.rust_ext_compat:
                         return ancestor.lazyancestors(
                             self._uncheckedparentrevs,
                             revs,
                             stoprev=stoprev,
                             inclusive=inclusive,
                         )
                     return rustancestor.LazyAncestors(
                         self.index, revs, stoprev=stoprev, inclusive=inclusive
                     )
                 def descendants(self, revs):
                     """Return ``dagop.descendantrevs`` of ``revs`` over this revlog."""
                     walk = dagop.descendantrevs
                     return walk(revs, self.revs, self.parentrevs)
                 def findcommonmissing(self, common=None, heads=None):
                     """Return a tuple of the ancestors of common and the ancestors of
                     heads that are not ancestors of common.

                     In revset terminology, we return the tuple:

                       ::common, (::heads) - (::common)

                     The first element is a lazy set of revision numbers; the second
                     is a list of nodes sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid.
                     """
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()
                     torev = self.rev
                     common = [torev(n) for n in common]
                     heads = [torev(n) for n in heads]

                     class lazyset:
                         """Set-like union of eagerly added values and a lazy container."""

                         def __init__(self, lazyvalues):
                             self.addedvalues = set()
                             self.lazyvalues = lazyvalues

                         def __contains__(self, value):
                             if value in self.addedvalues:
                                 return True
                             return value in self.lazyvalues

                         def __iter__(self):
                             added = self.addedvalues
                             yield from added
                             yield from (r for r in self.lazyvalues if r not in added)

                         def add(self, value):
                             self.addedvalues.add(value)

                         def update(self, values):
                             self.addedvalues.update(values)

                     # we want the ancestors, but inclusive
                     has = lazyset(self.ancestors(common))
                     has.add(nullrev)
                     has.update(common)
                     # take all ancestors from heads that aren't in has
                     missing = set()
                     pending = collections.deque(r for r in heads if r not in has)
                     while pending:
                         rev = pending.popleft()
                         if rev in missing:
                             continue
                         missing.add(rev)
                         pending.extend(
                             p for p in self.parentrevs(rev) if p not in has
                         )
                     return has, [self.node(rev) for rev in sorted(missing)]
                 def incrementalmissingrevs(self, common=None):
                     """Return an object that can be used to incrementally compute the
                     revision numbers of the ancestors of arbitrary sets that are not
                     ancestors of common.

                     This is an ancestor.incrementalmissingancestors object, or its
                     Rust counterpart when the Rust extension can be used with this
                     index.

                     'common' is a list of revision numbers. If common is not
                     supplied, uses nullrev.
                     """
                     if common is None:
                         common = [nullrev]
                     if rustancestor is None or not self.index.rust_ext_compat:
                         return ancestor.incrementalmissingancestors(
                             self.parentrevs, common
                         )
                     return rustancestor.MissingAncestors(self.index, common)
                 def findmissingrevs(self, common=None, heads=None):
                     """Return the revision numbers of the ancestors of heads that
                     are not ancestors of common.

                     More specifically, return a list of revision numbers
                     corresponding to nodes N such that every N satisfies the
                     following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of revision numbers.  If
                     heads is not supplied, uses all of the revlog's heads.  If
                     common is not supplied, uses nullrev.
                     """
                     common = [nullrev] if common is None else common
                     heads = self.headrevs() if heads is None else heads
                     tracker = self.incrementalmissingrevs(common=common)
                     return tracker.missingancestors(heads)
                 def findmissing(self, common=None, heads=None):
                     """Return the ancestors of heads that are not ancestors of common.

                     More specifically, return a list of nodes N such that every N
                     satisfies the following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid.
                     """
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()
                     torev = self.rev
                     common_revs = [torev(n) for n in common]
                     head_revs = [torev(n) for n in heads]
                     tracker = self.incrementalmissingrevs(common=common_revs)
                     tonode = self.node
                     return [tonode(r) for r in tracker.missingancestors(head_revs)]
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a topological path from 'roots' to 'heads'.

                     Return a tuple (nodes, outroots, outheads) where 'nodes' is a
                     topologically sorted list of all nodes N that satisfy both of
                     these constraints:

                       1. N is a descendant of some node in 'roots'
                       2. N is an ancestor of some node in 'heads'

                     Every node is considered to be both a descendant and an ancestor
                     of itself, so every reachable node in 'roots' and 'heads' will be
                     included in 'nodes'.

                     'outroots' is the list of reachable nodes in 'roots', i.e., the
                     subset of 'roots' that is returned in 'nodes'.  Likewise,
                     'outheads' is the subset of 'heads' that is also in 'nodes'.

                     'roots' and 'heads' are both lists of node IDs.  If 'roots' is
                     unspecified, uses nullid as the only root.  If 'heads' is
                     unspecified, uses list of all of the revlog's heads.

                     An empty 'roots' or 'heads' list, or inputs with no node in
                     between, yield three empty lists.
                     """
                     # Result returned whenever there is nothing to report.
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [self.nullid]  # Everybody's a descendant of nullid
                         lowestrev = nullrev
                     if (lowestrev == nullrev) and (heads is None):
                         # We want _all_ the nodes!
                         return (
                             [self.node(r) for r in self],
                             [self.nullid],
                             list(self.heads()),
                         )
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = len(self) - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = set()
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, False)
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = set(heads)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == self.nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendant of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors.add(n)  # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.update(
                                         [p for p in self.parents(n) if p != self.nullid]
                                     )
                                 elif n in heads:  # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > nullrev:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [root for root in roots if root in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(root) for root in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = nullrev
                             roots = [self.nullid]
                     # Transform our roots list into a set.
                     descendants = set(roots)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendants.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descendants, empty parents will look like
                     # they're descendants.
                     for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
                         n = self.node(r)
                         isdescendant = False
                         if lowestrev == nullrev:  # Everybody is a descendant of nullid
                             isdescendant = True
                         elif n in descendants:
                             # n is already a descendant
                             isdescendant = True
                             # This check only needs to be done here because all the roots
                             # were marked as descendants before the loop started.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendants, it's not a root.
                                 if (p[0] in descendants) or (p[1] in descendants):
                                     roots.remove(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendant if either of its parents are
                             # descendants.  (We seeded the descendants set with the
                             # roots up there, remember?)
                             if (p[0] in descendants) or (p[1] in descendants):
                                 descendants.add(n)
                                 isdescendant = True
                         if isdescendant and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendants and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = True
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = True
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     # Keep only the heads that were actually reached (flag is True).
                     heads = [head for head, flag in heads.items() if flag]
                     roots = list(roots)
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def headrevs(self, revs=None):
                     """Return the head revisions of the revlog, or of ``revs``.

                     Without ``revs`` the index's own ``headrevs()`` is used, falling
                     back to ``self._headrevs()`` when the index does not provide it.
                     With ``revs`` the computation is delegated to the Rust or Python
                     ``dagop`` implementation.
                     """
                     if revs is not None:
                         if rustdagop is not None and self.index.rust_ext_compat:
                             return rustdagop.headrevs(self.index, revs)
                         return dagop.headrevs(revs, self._uncheckedparentrevs)
                     try:
                         return self.index.headrevs()
                     except AttributeError:
                         return self._headrevs()
                 def computephases(self, roots):
                     """Return ``self.index.computephasesmapsets(roots)``."""
                     index = self.index
                     return index.computephasesmapsets(roots)
                 def _headrevs(self):
                     """Compute the head revisions from the index entries.

                     Returns ``[nullrev]`` for an empty revlog.
                     """
                     total = len(self)
                     if total == 0:
                         return [nullrev]
                     # One extra slot at the end receives the writes made for
                     # negative (null) parent revisions.  Revisions we do not iterate
                     # over (filtered ones) stay at 0, so nobody is a head at start.
                     marks = [0] * (total + 1)
                     index = self.index
                     for rev in self:
                         marks[rev] = 1  # may be a head
                         entry = index[rev]
                         # its parents are not heads
                         marks[entry[5]] = 0
                         marks[entry[6]] = 0
                     return [rev for rev, flag in enumerate(marks) if flag]
                 def heads(self, start=None, stop=None):
                     """Return the list of all nodes that have no children.

                     If start is specified, only heads that are descendants of start
                     will be returned.

                     If stop is specified, it will consider all the revs from stop as
                     if they had no children.
                     """
                     tonode = self.node
                     if start is None and stop is None:
                         if len(self) == 0:
                             return [self.nullid]
                         return [tonode(r) for r in self.headrevs()]
                     startrev = nullrev if start is None else self.rev(start)
                     stoprevs = {self.rev(n) for n in stop or []}
                     headrevs = dagop.headrevssubset(
                         self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
                     )
                     return [tonode(rev) for rev in headrevs]
                 def children(self, node):
                     """Find the children of a given node.

                     Every later revision is scanned.  A revision without any
                     non-null parent counts as a child of the null revision.
                     """
                     target = self.rev(node)
                     found = []
                     for rev in self.revs(start=target + 1):
                         real_parents = [
                             p for p in self.parentrevs(rev) if p != nullrev
                         ]
                         if not real_parents:
                             if target == nullrev:
                                 found.append(self.node(rev))
                             continue
                         for parent in real_parents:
                             if parent == target:
                                 found.append(self.node(rev))
                     return found
                 def commonancestorsheads(self, a, b):
                     """Calculate all the heads of the common ancestors of nodes a and b.

                     Both arguments and the returned values are node IDs.
                     """
                     rev_a = self.rev(a)
                     rev_b = self.rev(b)
                     head_revs = self._commonancestorsheads(rev_a, rev_b)
                     return pycompat.maplist(self.node, head_revs)
                 def _commonancestorsheads(self, *revs):
                     """Calculate all the heads of the common ancestors of revs.

                     The index implementation is tried first; the pure Python one from
                     the ``ancestor`` module is the fallback when the index lacks the
                     method or raises ``OverflowError``.
                     """
                     try:
                         return self.index.commonancestorsheads(*revs)
                     except (AttributeError, OverflowError):
                         # C implementation failed
                         return ancestor.commonancestorsheads(self.parentrevs, *revs)
                 def isancestor(self, a, b):
                     """Return True if node a is an ancestor of node b.

                     A revision is considered an ancestor of itself.
                     """
                     rev_a = self.rev(a)
                     rev_b = self.rev(b)
                     return self.isancestorrev(rev_a, rev_b)
                 def isancestorrev(self, a, b):
                     """Return True if revision a is an ancestor of revision b.

                     A revision is considered an ancestor of itself.

                     The implementation of this is trivial but the use of
                     reachableroots is not.
                     """
                     if a == nullrev or a == b:
                         return True
                     if a > b:
                         return False
                     reached = self.reachableroots(a, [b], [a], includepath=False)
                     return bool(reached)
                 def reachableroots(self, minroot, heads, roots, includepath=False):
                     """Return (heads(::(<roots> and <roots>::<heads>))).

                     If includepath is True, return (<roots>::<heads>).

                     The index's ``reachableroots2`` is used when available, the pure
                     Python ``dagop`` implementation otherwise.
                     """
                     try:
                         native = self.index.reachableroots2
                         return native(minroot, heads, roots, includepath)
                     except AttributeError:
                         return dagop._reachablerootspure(
                             self.parentrevs, minroot, roots, heads, includepath
                         )
                 def ancestor(self, a, b):
                     """Calculate the "best" common ancestor of nodes a and b.

                     Returns ``self.nullid`` when no common ancestor is found.
                     """
                     a, b = self.rev(a), self.rev(b)
                     try:
                         candidates = self.index.ancestors(a, b)
                     except (AttributeError, OverflowError):
                         candidates = ancestor.ancestors(self.parentrevs, a, b)
                     if not candidates:
                         return self.nullid
                     # choose a consistent winner when there's a tie
                     return min(map(self.node, candidates))
                 def _match(self, id):
                     """Resolve ``id`` to a node using exact matches only.

                     ``id`` is tried, in this order, as an integer revision, a binary
                     node, the bytes form of a (possibly negative) revision number
                     and a full hex node id.  Returns None when nothing matches.
                     """
                     if isinstance(id, int):
                         # rev
                         return self.node(id)
                     nodelen = self.nodeconstants.nodelen
                     if len(id) == nodelen:
                         # possibly a binary node
                         # odds of a binary node being all hex in ASCII are 1 in 10**25
                         try:
                             self.rev(id)  # quick search the index
                         except error.LookupError:
                             pass  # may be partial hex id
                         else:
                             return id
                     try:
                         # str(rev)
                         rev = int(id)
                         if b"%d" % rev != id:
                             raise ValueError
                         if rev < 0:
                             # negative numbers count from the end
                             rev = len(self) + rev
                         if rev < 0 or rev >= len(self):
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         pass
                     if len(id) == 2 * nodelen:
                         try:
                             # a full hex nodeid?
                             candidate = bin(id)
                             self.rev(candidate)
                             return candidate
                         except (binascii.Error, error.LookupError):
                             pass
                     return None
                 def _partialmatch(self, id):
                     """Resolve a hex node prefix ``id`` to a node.

                     Returns the matching node, or None when nothing matches.

                     Raises ``error.AmbiguousPrefixLookupError`` when several
                     candidates match (a prefix of the working directory hex id
                     counts as a candidate) and ``error.WdirUnsupported`` when the
                     prefix can only designate the working directory.

                     The index's own ``partialmatch`` is tried first; a scan over all
                     index entries is the fallback.  Unique results of that scan are
                     cached in ``self._pcache``.
                     """
                     # we don't care about wdirfilenodeids as they should always be a
                     # full hash
                     maybewdir = self.nodeconstants.wdirhex.startswith(id)
                     ambiguous = False
                     try:
                         partial = self.index.partialmatch(id)
                         if partial and self.hasnode(partial):
                             if maybewdir:
                                 # single 'ff...' match in radix tree, ambiguous with wdir
                                 ambiguous = True
                             else:
                                 return partial
                         elif maybewdir:
                             # no 'ff...' match in radix tree, wdir identified
                             raise error.WdirUnsupported
                         else:
                             return None
                     except error.RevlogError:
                         # parsers.c radix tree lookup gave multiple matches
                         # fast path: for unfiltered changelog, radix tree is accurate
                         if not getattr(self, 'filteredrevs', None):
                             ambiguous = True
                         # fall through to slow path that filters hidden revisions
                     except (AttributeError, ValueError):
                         # we are pure python, or key is not hex
                         pass
                     if ambiguous:
                         raise error.AmbiguousPrefixLookupError(
                             id, self.display_id, _(b'ambiguous identifier')
                         )
                     # Slow path, starting with the cache of earlier unique matches.
                     if id in self._pcache:
                         return self._pcache[id]
                     # NOTE(review): 40 is presumably the hex length of a 20-byte
                     # node; _match uses 2 * self.nodeconstants.nodelen for the same
                     # notion - confirm whether this literal should follow it.
                     # Longer ids fall off the end of the method and yield None.
                     if len(id) <= 40:
                         # hex(node)[:...]
                         l = len(id) // 2 * 2  # grab an even number of digits
                         try:
                             # we're dropping the last digit, so let's check that it's hex,
                             # to avoid the expensive computation below if it's not
                             if len(id) % 2 > 0:
                                 if not (id[-1] in hexdigits):
                                     return None
                             prefix = bin(id[:l])
                         except binascii.Error:
                             # not a hex string: no match (None is returned implicitly)
                             pass
                         else:
                             # Pre-filter on the binary prefix, then confirm against
                             # the full (possibly odd-length) hex prefix and drop the
                             # nodes hasnode() rejects.
                             nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                             nl = [
                                 n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                             ]
                             if self.nodeconstants.nullhex.startswith(id):
                                 nl.append(self.nullid)
                             if len(nl) > 0:
                                 if len(nl) == 1 and not maybewdir:
                                     self._pcache[id] = nl[0]
                                     return nl[0]
                                 raise error.AmbiguousPrefixLookupError(
                                     id, self.display_id, _(b'ambiguous identifier')
                                 )
                             if maybewdir:
                                 raise error.WdirUnsupported
                             return None
                 def lookup(self, id):
                     """Locate a node based on:

                     - revision number or str(revision number)
                     - nodeid or subset of hex nodeid

                     Raises ``error.LookupError`` when nothing matches.
                     """
                     exact = self._match(id)
                     if exact is not None:
                         return exact
                     partial = self._partialmatch(id)
                     if not partial:
                         raise error.LookupError(
                             id, self.display_id, _(b'no match found')
                         )
                     return partial
                 def shortest(self, node, minlength=1):
                     """Find the shortest unambiguous prefix that matches node.

                     ``minlength`` is the smallest prefix length that is tried.
                     ``error.LookupError`` is raised when ``node`` cannot be resolved.
                     The returned prefix is a slice of ``hex(node)``.
                     """
                     def isvalid(prefix):
                         # A prefix is valid when ``_partialmatch()`` does not report it
                         # as ambiguous.
                         try:
                             matchednode = self._partialmatch(prefix)
                         except error.AmbiguousPrefixLookupError:
                             return False
                         except error.WdirUnsupported:
                             # single 'ff...' match
                             return True
                         if matchednode is None:
                             # nothing matches this prefix at all: the node is unknown
                             raise error.LookupError(node, self.display_id, _(b'no node'))
                         return True
                     def maybewdir(prefix):
                         # True when the prefix is made only of 'f' characters
                         return all(c == b'f' for c in pycompat.iterbytestr(prefix))
                     hexnode = hex(node)
                     def disambiguate(hexnode, minlength):
                         """Disambiguate against wdirid."""
                         # Grow the prefix until it is no longer made only of 'f's.
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if not maybewdir(prefix):
                                 return prefix
                     # Fast path: only used when ``filteredrevs`` is missing or empty.
                     if not getattr(self, 'filteredrevs', None):
                         try:
                             length = max(self.index.shortest(node), minlength)
                             return disambiguate(hexnode, length)
                         except error.RevlogError:
                             # Any node other than wdirid is reported as missing; wdirid
                             # falls through to the slower code below.
                             if node != self.nodeconstants.wdirid:
                                 raise error.LookupError(
                                     node, self.display_id, _(b'no node')
                                 )
                         except AttributeError:
                             # Fall through to pure code
                             pass
                     if node == self.nodeconstants.wdirid:
                         # wdirid: return the first prefix accepted by ``isvalid()``
                         # directly, without passing it through ``disambiguate()``.
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if isvalid(prefix):
                                 return prefix
                     # Generic path: find the first valid length, then make sure the
                     # result cannot be confused with a wdirid prefix.
                     for length in range(minlength, len(hexnode) + 1):
                         prefix = hexnode[:length]
                         if isvalid(prefix):
                             return disambiguate(hexnode, length)
                 def cmp(self, node, text):
                     """Tell whether ``text`` differs from the stored revision ``node``.

                     The SHA-1 revision hash of ``text`` with the parents of ``node`` is
                     computed and compared to ``node``; True means "different".
                     """
                     first_parent, second_parent = self.parents(node)
                     computed = storageutil.hashrevisionsha1(
                         text, first_parent, second_parent
                     )
                     return computed != node
                 def deltaparent(self, rev):
                     """Return the revision that ``rev`` is stored as a delta against.

                     ``nullrev`` is returned when the index lists ``rev`` as its own
                     base.  Otherwise the recorded base is returned for general-delta
                     revlogs, and ``rev - 1`` for the others.
                     """
                     stored_base = self.index[rev][3]
                     if stored_base == rev:
                         return nullrev
                     if not self.delta_config.general_delta:
                         return rev - 1
                     return stored_base
                 def issnapshot(self, rev):
                     """tells whether rev is a snapshot

                     The answer comes from ``self._inner.issnapshot``.
                     """
                     ret = self._inner.issnapshot(rev)
                     # Rebind the attribute on this instance so that later calls go
                     # straight to the inner implementation, bypassing this wrapper.
                     self.issnapshot = self._inner.issnapshot
                     return ret
                 def snapshotdepth(self, rev):
                     """number of snapshot in the chain before this one

                     Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
                     The depth is the length of the delta chain of ``rev`` minus one.
                     """
                     if not self.issnapshot(rev):
                         # interpolate the revision number so the message names the
                         # offending revision instead of showing a raw '%d'
                         raise error.ProgrammingError(
                             b'revision %d not a snapshot' % rev
                         )
                     return len(self._inner._deltachain(rev)[0]) - 1
                 def revdiff(self, rev1, rev2):
                     """Return a binary delta turning ``rev1`` into ``rev2``.

                     The result is meant to be written to revlog data directly, so it
                     is based on raw revision data.  When ``rev2`` is already stored as
                     a delta against ``rev1`` (and ``rev1`` is not ``nullrev``), the
                     stored chunk is returned as-is; otherwise the delta is computed
                     from the raw data of both revisions.
                     """
                     stored_as_delta = (
                         rev1 != nullrev and self.deltaparent(rev2) == rev1
                     )
                     if not stored_as_delta:
                         old_raw = self.rawdata(rev1)
                         new_raw = self.rawdata(rev2)
                         return mdiff.textdiff(old_raw, new_raw)
                     return bytes(self._inner._chunk(rev2))
                 def revision(self, nodeorrev):
                     """return an uncompressed revision of a given node or revision
                     number.

                     Equivalent to ``self._revisiondata(nodeorrev)`` with ``raw`` left
                     at its default of ``False``.
                     """
                     return self._revisiondata(nodeorrev)
                 def sidedata(self, nodeorrev):
                     """Return the extra data attached to a changeset outside its hash.

                     ``nodeorrev`` is either a revision number (``int``) or a node,
                     which is first translated with ``self.rev()``.

                     This function currently returns a dictionary. However, a more
                     advanced mapping object will likely be used in the future for
                     more efficient/lazy code.
                     """
                     rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
                     return self._sidedata(rev)
                 def _rawtext(self, node, rev):
                     """Fetch the rawtext of a revision, possibly without validation.

                     Returns a ``(rev, rawtext, validated)`` tuple.  On a revision-cache
                     hit, ``rev`` is handed back exactly as received (it may still be
                     ``None``) and ``validated`` is True.  Otherwise ``rev`` is resolved
                     from ``node`` when missing and the result of
                     ``self._inner.raw_text()`` is returned.
                     """
                     # The cache entry looks like (node, rev, rawtext)
                     cached = self._inner._revisioncache
                     if cached and cached[0] == node:
                         return (rev, cached[2], True)
                     if rev is None:
                         rev = self.rev(node)
                     return self._inner.raw_text(node, rev)
                 def _revisiondata(self, nodeorrev, raw=False):
                     """Return the text (or, with ``raw=True``, the rawtext) of a revision.

                     ``nodeorrev`` is a revision number (``int``) or a node.  The null
                     node always yields ``b""``.  Flag processors are applied and the
                     hash is checked when they request it; a rawtext that was not
                     served from the cache is stored in the revision cache on the way
                     out.
                     """
                     # normalise the <nodeorrev> argument
                     if isinstance(nodeorrev, int):
                         rev, node = nodeorrev, self.node(nodeorrev)
                     else:
                         rev, node = None, nodeorrev

                     # the special `nullid` revision has no content
                     if node == self.nullid:
                         return b""

                     # ``rawtext`` is what the revlog stores; it may be the revision
                     # itself or may require processing to obtain the revision.
                     rev, rawtext, validated = self._rawtext(node, rev)

                     # a cached rawtext can be returned untouched to raw callers
                     if validated and raw:
                         return rawtext

                     if rev is None:
                         rev = self.rev(node)

                     # revision flags (usually altering its state or content)
                     flags = self.flags(rev)
                     if validated and flags == REVIDX_DEFAULT_FLAGS:
                         # no flag set means no processor to run: text is rawtext
                         return rawtext

                     if raw:
                         text = rawtext
                         validatehash = flagutil.processflagsraw(self, rawtext, flags)
                     else:
                         text, validatehash = flagutil.processflagsread(
                             self, rawtext, flags
                         )

                     if validatehash:
                         self.checkhash(text, node, rev=rev)
                     if not validated:
                         self._inner._revisioncache = (node, rev, rawtext)
                     return text
                 def _sidedata(self, rev):
                     """Return the sidedata of revision number ``rev``.

                     The docket's ``sidedata_end`` is forwarded to the inner revlog
                     when a docket exists; ``None`` is forwarded otherwise.
                     """
                     docket = self._docket
                     sidedata_end = None if docket is None else docket.sidedata_end
                     return self._inner.sidedata(rev, sidedata_end)
                 def rawdata(self, nodeorrev):
                     """return an uncompressed raw data of a given node or revision number.

                     Equivalent to ``self._revisiondata(nodeorrev, raw=True)``.
                     """
                     return self._revisiondata(nodeorrev, raw=True)
                 def hash(self, text, p1, p2):
                     """Compute a node hash.

                     Available as a function so that subclasses can replace the hash
                     as needed.

                     This implementation delegates to
                     ``storageutil.hashrevisionsha1(text, p1, p2)``.
                     """
                     return storageutil.hashrevisionsha1(text, p1, p2)
                 def checkhash(self, text, node, p1=None, p2=None, rev=None):
                     """Verify that ``text`` hashes to ``node``.

                     Kept as a method so subclasses can extend what happens on a hash
                     mismatch.  The parents are looked up from ``node`` when both
                     ``p1`` and ``p2`` are ``None``.

                     Raises ``error.RevlogError`` on mismatch, or
                     ``error.CensoredNodeError`` when this revlog is censorable and
                     ``text`` is censored text.
                     """
                     try:
                         if p1 is None and p2 is None:
                             p1, p2 = self.parents(node)
                         if node != self.hash(text, p1, p2):
                             # Drop the revision cache entry for this node.  The cache
                             # only holds the raw revision, so this costs a cache miss
                             # on the next raw access; that should be rare, and teaching
                             # the cache about the verification state is extra work.
                             cached = self._inner._revisioncache
                             if cached and cached[0] == node:
                                 self._inner._revisioncache = None

                             if rev is None:
                                 revornode = templatefilters.short(hex(node))
                             else:
                                 revornode = rev
                             message = _(b"integrity check failed on %s:%s")
                             raise error.RevlogError(
                                 message % (self.display_id, pycompat.bytestr(revornode))
                             )
                     except error.RevlogError:
                         is_censored = (
                             self.feature_config.censorable
                             and storageutil.iscensoredtext(text)
                         )
                         if is_censored:
                             raise error.CensoredNodeError(self.display_id, node, text)
                         raise
                 @property
                 def _split_index_file(self):
                     """Path where the index of an ongoing split operation is expected.

                     The file only exists while a split is in progress, but its
                     location is always the same for a given revlog.
                     """
                     segments = self.radix.split(b'/')
                     if len(segments) <= 1:
                         # the revlog lives at the root of the store (changelog or
                         # manifest), no risk of collision.
                         return self.radix + b'.i.s'
                     # append '-s' to the leading directory (the `data/` or `meta/`
                     # base) and '.i' to the final component
                     first, *middle, last = segments
                     return b'/'.join([first + b'-s', *middle, last + b'.i'])
                 def _enforceinlinesize(self, tr, side_write=True):
                     """Check if the revlog is too big for inline and convert if so.

                     This should be called after revisions are added to the revlog. If the
                     revlog has grown too large to be an inline revlog, it will convert it
                     to use multiple index and data files.

                     ``tr`` is the transaction the conversion is registered with.  When
                     ``side_write`` is true, the new index is written to
                     ``self._split_index_file`` and renamed over the original index
                     when the transaction is finalized.

                     Raises ``error.ProgrammingError`` if an inline revlog has a docket
                     and ``error.RevlogError`` if the index is unknown to the
                     transaction (except for the changelog).
                     """
                     tiprev = len(self) - 1
                     total_size = self.start(tiprev) + self.length(tiprev)
                     # nothing to do for non-inline revlogs, or inline ones that may stay
                     # inline and are still below the size limit
                     if not self._inline or (self._may_inline and total_size < _maxinline):
                         return
                     if self._docket is not None:
                         msg = b"inline revlog should not have a docket"
                         raise error.ProgrammingError(msg)
                     # In the common case, we enforce inline size because the revlog has
                     # been appended to. And in such a case, it must have an initial offset
                     # recorded in the transaction.
                     troffset = tr.findoffset(self._inner.canonical_index_file)
                     pre_touched = troffset is not None
                     if not pre_touched and self.target[0] != KIND_CHANGELOG:
                         raise error.RevlogError(
                             _(b"%s not found in the transaction") % self._indexfile
                         )
                     tr.addbackup(self._inner.canonical_index_file, for_offset=pre_touched)
                     tr.add(self._datafile, 0)
                     new_index_file_path = None
                     if side_write:
                         old_index_file_path = self._indexfile
                         new_index_file_path = self._split_index_file
                         opener = self.opener
                         # the callbacks only hold a weak reference to this revlog
                         weak_self = weakref.ref(self)
                         # the "split" index replaces the real index when the transaction
                         # is finalized
                         def finalize_callback(tr):
                             opener.rename(
                                 new_index_file_path,
                                 old_index_file_path,
                                 checkambig=True,
                             )
                             maybe_self = weak_self()
                             if maybe_self is not None:
                                 maybe_self._indexfile = old_index_file_path
                                 maybe_self._inner.index_file = maybe_self._indexfile
                         # on abort, point the revlog back at the original inline index
                         def abort_callback(tr):
                             maybe_self = weak_self()
                             if maybe_self is not None:
                                 maybe_self._indexfile = old_index_file_path
                                 maybe_self._inner.inline = True
                                 maybe_self._inner.index_file = old_index_file_path
                         tr.registertmp(new_index_file_path)
                         # the callback id is built from the revlog target
                         if self.target[1] is not None:
                             callback_id = b'000-revlog-split-%d-%s' % self.target
                         else:
                             callback_id = b'000-revlog-split-%d' % self.target[0]
                         tr.addfinalize(callback_id, finalize_callback)
                         tr.addabort(callback_id, abort_callback)
                     # clear the inline flag before asking the inner revlog to split
                     self._format_flags &= ~FLAG_INLINE_DATA
                     self._inner.split_inline(
                         tr,
                         self._format_flags | self._format_version,
                         new_index_file_path=new_index_file_path,
                     )
                     self._inline = False
                     if new_index_file_path is not None:
                         self._indexfile = new_index_file_path
                     nodemaputil.setup_persistent_nodemap(tr, self)
                 def _nodeduplicatecallback(self, transaction, node):
                     """called when trying to add a node already stored.

                     This implementation does nothing and returns ``None``.
                     """
                 @contextlib.contextmanager
                 def reading(self):
                     """Context manager wrapping ``self._inner.reading()``.

                     Nothing is yielded to the ``with`` statement.
                     """
                     with self._inner.reading():
                         yield
                 @contextlib.contextmanager
                 def _writing(self, transaction):
                     """Context manager under which revisions may be written.

                     Raises ``error.ProgrammingError`` for a ``trypending`` revlog.
                     When the inner revlog is already writing, the context is a plain
                     pass-through.  Otherwise ``self._inner.writing()`` is entered
                     (seeded with the docket's end offsets when a docket exists) and
                     the docket, if any, is written once the body completes.
                     """
                     if self._trypending:
                         msg = b'try to write in a `trypending` revlog: %s' % self.display_id
                         raise error.ProgrammingError(msg)
                     if self._inner.is_writing:
                         # already inside a writing context: nothing to set up
                         yield
                         return
                     docket = self._docket
                     if docket is None:
                         data_end = sidedata_end = None
                     else:
                         data_end = docket.data_end
                         sidedata_end = docket.sidedata_end
                     writing_ctx = self._inner.writing(
                         transaction,
                         data_end=data_end,
                         sidedata_end=sidedata_end,
                     )
                     with writing_ctx:
                         yield
                         if self._docket is not None:
                             self._write_docket(transaction)
                 @property
                 def is_delaying(self):
                     """The ``is_delaying`` attribute of the inner revlog object."""
                     return self._inner.is_delaying
                 def _write_docket(self, transaction):
                     """write the current docket on disk

                     Exists as a method to help changelog implement its transaction
                     logic. We could also imagine using the same transaction logic for
                     all revlogs since dockets are cheap.

                     Delegates to ``self._docket.write(transaction)``.
                     """
                     self._docket.write(transaction)
                 def addrevision(
                     self,
                     text,
                     transaction,
                     link,
                     p1,
                     p2,
                     cachedelta=None,
                     node=None,
                     flags=REVIDX_DEFAULT_FLAGS,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a revision to the log and return its revision number.

                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     cachedelta - an optional precomputed delta
                     node - nodeid of revision; usually left unset, in which case it is
                         computed as hash(text, p1, p2). Subclasses might use a
                         different hashing method (and override checkhash() in such
                         case)
                     flags - the known flags to set on the revision
                     deltacomputer - an optional deltacomputer instance shared between
                         multiple calls
                     sidedata - an optional mapping of side data; passing a non-empty
                         one to a revlog without side-data support is a programming
                         error

                     If the node is already present in the index, its existing
                     revision number is returned and nothing is written.
                     """
                     if link == nullrev:
                         msg = _(b"attempted to add linkrev -1 to %s")
                         raise error.RevlogError(msg % self.display_id)

                     if sidedata is None:
                         sidedata = {}
                     if sidedata and not self.feature_config.has_side_data:
                         raise error.ProgrammingError(
                             _(b"trying to add sidedata to a revlog who don't support them")
                         )

                     if flags and not node:
                         node = self.hash(text, p1, p2)

                     rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

                     # A precomputed delta is meaningless once the flag processor has
                     # altered the revision data.
                     if rawtext != text:
                         cachedelta = None

                     rawsize = len(rawtext)
                     if rawsize > _maxentrysize:
                         raise error.RevlogError(
                             _(
                                 b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                             )
                             % (self.display_id, rawsize)
                         )

                     if not node:
                         node = self.hash(rawtext, p1, p2)
                     known_rev = self.index.get_rev(node)
                     if known_rev is not None:
                         return known_rev

                     if validatehash:
                         self.checkhash(rawtext, node, p1=p1, p2=p2)

                     return self.addrawrevision(
                         rawtext,
                         transaction,
                         link,
                         p1,
                         p2,
                         node,
                         flags,
                         cachedelta=cachedelta,
                         deltacomputer=deltacomputer,
                         sidedata=sidedata,
                     )
                 def addrawrevision(
                     self,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     node,
                     flags,
                     cachedelta=None,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """add a raw revision with known flags, node and parents
                     useful when reusing a revision not stored in this revlog (ex: received
                     over wire, or read from an external bundle).

                     Runs ``_addrevision()`` inside ``self._writing(transaction)`` and
                     returns its result.
                     """
                     with self._writing(transaction):
                         return self._addrevision(
                             node,
                             rawtext,
                             transaction,
                             link,
                             p1,
                             p2,
                             flags,
                             cachedelta,
                             deltacomputer=deltacomputer,
                             sidedata=sidedata,
                         )
                 def compress(self, data):
                     """Compress ``data`` by delegating to ``self._inner.compress``."""
                     return self._inner.compress(data)
                 def decompress(self, data):
                     """Decompress ``data`` by delegating to ``self._inner.decompress``."""
                     return self._inner.decompress(data)
                 def _addrevision(
                     self,
                     node,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     flags,
                     cachedelta,
                     alwayscache=False,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """internal function to add revisions to the log
                     see addrevision for argument descriptions.
                     note: "addrevision" takes non-raw text, "_addrevision" takes raw text.
                     if "deltacomputer" is not provided or None, a defaultdeltacomputer will
                     be used.
                     invariants:
                     - rawtext is optional (can be None); if not set, cachedelta must be set.
                       if both are set, they must correspond to each other.

                     Must be called within a ``revlog._writing`` context.  Returns the
                     revision number of the new entry.  Raises ``error.RevlogError``
                     when asked to add the null or a wdir revision.
                     """
                     if node == self.nullid:
                         raise error.RevlogError(
                             _(b"%s: attempt to add null revision") % self.display_id
                         )
                     if (
                         node == self.nodeconstants.wdirid
                         or node in self.nodeconstants.wdirfilenodeids
                     ):
                         raise error.RevlogError(
                             _(b"%s: attempt to add wdir revision") % self.display_id
                         )
                     if self._inner._writinghandles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     # one-item list handed to ``revisioninfo``; it is read back as
                     # ``btext[0]`` once the entry has been written
                     btext = [rawtext]
                     # ``curr`` is the revision number the new entry will get
                     curr = len(self)
                     prev = curr - 1
                     offset = self._get_data_offset(prev)
                     if self._concurrencychecker:
                         ifh, dfh, sdfh = self._inner._writinghandles
                         # XXX no checking for the sidedata file
                         if self._inline:
                             # offset is "as if" it were in the .d file, so we need to add on
                             # the size of the entry metadata.
                             self._concurrencychecker(
                                 ifh, self._indexfile, offset + curr * self.index.entry_size
                             )
                         else:
                             # Entries in the .i are a consistent size.
                             self._concurrencychecker(
                                 ifh, self._indexfile, curr * self.index.entry_size
                             )
                             self._concurrencychecker(dfh, self._datafile, offset)
                     p1r, p2r = self.rev(p1), self.rev(p2)
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if rawtext is None:
                         # need rawtext size, before changed by flag processors, which is
                         # the non-raw size. use revlog explicitly to avoid filelog's extra
                         # logic that might remove metadata size.
                         textlen = mdiff.patchedsize(
                             revlog.size(self, cachedelta[0]), cachedelta[1]
                         )
                     else:
                         textlen = len(rawtext)
                     if deltacomputer is None:
                         # build a default delta computer, reporting through the
                         # transaction when delta debugging is enabled
                         write_debug = None
                         if self.delta_config.debug_delta:
                             write_debug = transaction._report
                         deltacomputer = deltautil.deltacomputer(
                             self, write_debug=write_debug
                         )
                     if cachedelta is not None and len(cachedelta) == 2:
                         # If the cached delta has no information about how it should be
                         # reused, add the default reuse instruction according to the
                         # revlog's configuration.
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse = DELTA_BASE_REUSE_NO
                         cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)
                     revinfo = revlogutils.revisioninfo(
                         node,
                         p1,
                         p2,
                         btext,
                         textlen,
                         cachedelta,
                         flags,
                     )
                     deltainfo = deltacomputer.finddeltainfo(revinfo)
                     # the compression mode is only refined when a docket is present
                     compression_mode = COMP_MODE_INLINE
                     if self._docket is not None:
                         default_comp = self._docket.default_compression_header
                         r = deltautil.delta_compression(default_comp, deltainfo)
                         compression_mode, deltainfo = r
                     sidedata_compression_mode = COMP_MODE_INLINE
                     if sidedata and self.feature_config.has_side_data:
                         # start from the uncompressed form; the compressed form is only
                         # kept below when it is usable and smaller
                         sidedata_compression_mode = COMP_MODE_PLAIN
                         serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
                         # NOTE(review): this branch reads ``self._docket`` without a
                         # None check -- presumably side-data support implies a docket;
                         # confirm.
                         sidedata_offset = self._docket.sidedata_end
                         h, comp_sidedata = self._inner.compress(serialized_sidedata)
                         if (
                             h != b'u'
                             and comp_sidedata[0:1] != b'\0'
                             and len(comp_sidedata) < len(serialized_sidedata)
                         ):
                             assert not h
                             if (
                                 comp_sidedata[0:1]
                                 == self._docket.default_compression_header
                             ):
                                 sidedata_compression_mode = COMP_MODE_DEFAULT
                                 serialized_sidedata = comp_sidedata
                             else:
                                 sidedata_compression_mode = COMP_MODE_INLINE
                                 serialized_sidedata = comp_sidedata
                     else:
                         serialized_sidedata = b""
                         # Don't store the offset if the sidedata is empty, that way
                         # we can easily detect empty sidedata and they will be no different
                         # than ones we manually add.
                         sidedata_offset = 0
                     # the rank is only computed when the feature is enabled; it is
                     # derived from the parents' revisions
                     rank = RANK_UNKNOWN
                     if self.feature_config.compute_rank:
                         if (p1r, p2r) == (nullrev, nullrev):
                             rank = 1
                         elif p1r != nullrev and p2r == nullrev:
                             rank = 1 + self.fast_rank(p1r)
                         elif p1r == nullrev and p2r != nullrev:
                             rank = 1 + self.fast_rank(p2r)
                         else:  # merge node
                             if rustdagop is not None and self.index.rust_ext_compat:
                                 rank = rustdagop.rank(self.index, p1r, p2r)
                             else:
                                 pmin, pmax = sorted((p1r, p2r))
                                 rank = 1 + self.fast_rank(pmax)
                                 rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))
                     e = revlogutils.entry(
                         flags=flags,
                         data_offset=offset,
                         data_compressed_length=deltainfo.deltalen,
                         data_uncompressed_length=textlen,
                         data_compression_mode=compression_mode,
                         data_delta_base=deltainfo.base,
                         link_rev=link,
                         parent_rev_1=p1r,
                         parent_rev_2=p2r,
                         node_id=node,
                         sidedata_offset=sidedata_offset,
                         sidedata_compressed_length=len(serialized_sidedata),
                         sidedata_compression_mode=sidedata_compression_mode,
                         rank=rank,
                     )
                     # the in-memory index is updated first, then the binary form of the
                     # new entry is fetched back for writing
                     self.index.append(e)
                     entry = self.index.entry_binary(curr)
                     if curr == 0 and self._docket is None:
                         # first entry of a docket-less revlog: prepend the packed
                         # format header
                         header = self._format_flags | self._format_version
                         header = self.index.pack_header(header)
                         entry = header + entry
                     self._writeentry(
                         transaction,
                         entry,
                         deltainfo.data,
                         link,
                         offset,
                         serialized_sidedata,
                         sidedata_offset,
                     )
                     rawtext = btext[0]
                     if alwayscache and rawtext is None:
                         rawtext = deltacomputer.buildtext(revinfo)
                     if type(rawtext) == bytes:  # only accept immutable objects
                         self._inner._revisioncache = (node, curr, rawtext)
                     self._chainbasecache[curr] = deltainfo.chainbase
                     return curr
                 def _get_data_offset(self, prev):
                     """Returns the current offset in the (in-transaction) data file.
                     Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket
                     file to store that information: since sidedata can be rewritten to the
                     end of the data file within a transaction, you can have cases where, for
                     example, rev `n` does not have sidedata while rev `n - 1` does, leading
                     to `n - 1`'s sidedata being written after `n`'s data.
                     TODO cache this in a docket file before getting out of experimental."""
                     if self._docket is None:
                         return self.end(prev)
                     else:
                         return self._docket.data_end
                 def _writeentry(
                     self,
                     transaction,
                     entry,
                     data,
                     link,
                     offset,
                     sidedata,
                     sidedata_offset,
                 ):
                     # Files opened in a+ mode have inconsistent behavior on various
                     # platforms. Windows requires that a file positioning call be made
                     # when the file handle transitions between reads and writes. See
                     # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
                     # platforms, Python or the platform itself can be buggy. Some versions
                     # of Solaris have been observed to not append at the end of the file
                     # if the file was seeked to before the end. See issue4943 for more.
                     #
                     # We work around this issue by inserting a seek() before writing.
                     # Note: This is likely not necessary on Python 3. However, because
                     # the file handle is reused for reads and may be seeked there, we need
                     # to be careful before changing this.
                     index_end = data_end = sidedata_end = None
                     if self._docket is not None:
                         index_end = self._docket.index_end
                         data_end = self._docket.data_end
                         sidedata_end = self._docket.sidedata_end
                     files_end = self._inner.write_entry(
                         transaction,
                         entry,
                         data,
                         link,
                         offset,
                         sidedata,
                         sidedata_offset,
                         index_end,
                         data_end,
                         sidedata_end,
                     )
                     self._enforceinlinesize(transaction)
                     if self._docket is not None:
                         self._docket.index_end = files_end[0]
                         self._docket.data_end = files_end[1]
                         self._docket.sidedata_end = files_end[2]
                     nodemaputil.setup_persistent_nodemap(transaction, self)
                  def addgroup(
                      self,
                      deltas,
                      linkmapper,
                      transaction,
                      alwayscache=False,
                      addrevisioncb=None,
                      duplicaterevisioncb=None,
                      debug_info=None,
                      delta_base_reuse_policy=None,
                  ):
                      """
                      add a delta group
                      given a set of deltas, add them to the revision log. the
                      first delta is against its parent, which should be in our
                      log, the rest are against the previous delta.
                      Each item of ``deltas`` is an 8-tuple
                      ``(node, p1, p2, linknode, deltabase, delta, flags, sidedata)``.
                      ``linkmapper`` is called with each ``linknode`` and its result is
                      stored as the link revision of the new entry.
                      If ``addrevisioncb`` is defined, it will be called with arguments of
                      this revlog and the revision that was added.
                      If ``duplicaterevisioncb`` is defined, it will be called with this
                      revlog and the existing revision whenever an incoming node is
                      already stored.
                      ``alwayscache`` is forwarded to ``_addrevision()`` and ``debug_info``
                      to the delta computer.
                      ``delta_base_reuse_policy`` defaults, when None, to a value derived
                      from this revlog's delta configuration.
                      Returns True if at least one delta was processed (added or found
                      to be a duplicate), False if ``deltas`` was empty.
                      Raises ``error.ProgrammingError`` on nested calls,
                      ``error.LookupError`` when a parent or the delta base is unknown,
                      and ``error.CensoredBaseError`` when a delta against a censored
                      base is not a full replacement.
                      """
                      if self._adding_group:
                          raise error.ProgrammingError(b'cannot nest addgroup() calls')
                      # read the default delta-base reuse policy from revlog config if the
                      # group did not specify one.
                      if delta_base_reuse_policy is None:
                          if (
                              self.delta_config.general_delta
                              and self.delta_config.lazy_delta_base
                          ):
                              delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
                          else:
                              delta_base_reuse_policy = DELTA_BASE_REUSE_NO
                      # flag reset in the ``finally`` below, whatever the outcome
                      self._adding_group = True
                      empty = True
                      try:
                          with self._writing(transaction):
                              write_debug = None
                              if self.delta_config.debug_delta:
                                  write_debug = transaction._report
                              # a single delta computer is shared by the whole group
                              deltacomputer = deltautil.deltacomputer(
                                  self,
                                  write_debug=write_debug,
                                  debug_info=debug_info,
                              )
                              # loop through our set of deltas
                              for data in deltas:
                                  (
                                      node,
                                      p1,
                                      p2,
                                      linknode,
                                      deltabase,
                                      delta,
                                      flags,
                                      sidedata,
                                  ) = data
                                  link = linkmapper(linknode)
                                  flags = flags or REVIDX_DEFAULT_FLAGS
                                  rev = self.index.get_rev(node)
                                  if rev is not None:
                                      # this can happen if two branches make the same change
                                      self._nodeduplicatecallback(transaction, rev)
                                      if duplicaterevisioncb:
                                          duplicaterevisioncb(self, rev)
                                      # a duplicate still counts as a processed delta
                                      empty = False
                                      continue
                                  # both parents and the delta base must already be stored
                                  for p in (p1, p2):
                                      if not self.index.has_node(p):
                                          raise error.LookupError(
                                              p, self.radix, _(b'unknown parent')
                                          )
                                  if not self.index.has_node(deltabase):
                                      raise error.LookupError(
                                          deltabase, self.display_id, _(b'unknown delta base')
                                      )
                                  baserev = self.rev(deltabase)
                                  if baserev != nullrev and self.iscensored(baserev):
                                      # if base is censored, delta must be full replacement in a
                                      # single patch operation
                                      hlen = struct.calcsize(b">lll")
                                      oldlen = self.rawsize(baserev)
                                      newlen = len(delta) - hlen
                                      if delta[:hlen] != mdiff.replacediffheader(
                                          oldlen, newlen
                                      ):
                                          raise error.CensoredBaseError(
                                              self.display_id, self.node(baserev)
                                          )
                                  # only probe the delta when no flag was provided at all
                                  if not flags and self._peek_iscensored(baserev, delta):
                                      flags |= REVIDX_ISCENSORED
                                  # We assume consumers of addrevisioncb will want to retrieve
                                  # the added revision, which will require a call to
                                  # revision(). revision() will fast path if there is a cache
                                  # hit. So, we tell _addrevision() to always cache in this case.
                                  # We're only using addgroup() in the context of changegroup
                                  # generation so the revision data can always be handled as raw
                                  # by the flagprocessor.
                                  rev = self._addrevision(
                                      node,
                                      None,
                                      transaction,
                                      link,
                                      p1,
                                      p2,
                                      flags,
                                      (baserev, delta, delta_base_reuse_policy),
                                      alwayscache=alwayscache,
                                      deltacomputer=deltacomputer,
                                      sidedata=sidedata,
                                  )
                                  if addrevisioncb:
                                      addrevisioncb(self, rev)
                                  empty = False
                      finally:
                          self._adding_group = False
                      return not empty
                 def iscensored(self, rev):
                     """Check if a file revision is censored."""
                     if not self.feature_config.censorable:
                         return False
                     return self.flags(rev) & REVIDX_ISCENSORED
                 def _peek_iscensored(self, baserev, delta):
                     """Quickly check if a delta produces a censored revision."""
                     if not self.feature_config.censorable:
                         return False
                     return storageutil.deltaiscensored(delta, baserev, self.rawsize)
                 def getstrippoint(self, minlink):
                     """find the minimum rev that must be stripped to strip the linkrev
                     Returns a tuple containing the minimum rev and a set of all revs that
                     have linkrevs that will be broken by this strip.
                     """
                     return storageutil.resolvestripinfo(
                         minlink,
                         len(self) - 1,
                         self.headrevs(),
                         self.linkrev,
                         self.parentrevs,
                     )
                  def strip(self, minlink, transaction):
                      """truncate the revlog on the first revision with a linkrev >= minlink
                      This function is called when we're stripping revision minlink and
                      its descendants from the repository.
                      We have to remove all revisions with linkrev >= minlink, because
                      the equivalent changelog revisions will be renumbered after the
                      strip.
                      So we truncate the revlog on the first of these revisions, and
                      trust that the caller has saved the revisions that shouldn't be
                      removed and that it'll re-add them after this truncation.
                      The new end offset of each affected file is registered with
                      ``transaction``; nothing is done for an empty revlog or when the
                      strip point equals ``len(self)``.
                      """
                      if len(self) == 0:
                          return
                      # only the first element (minimum rev to strip) is needed here
                      rev, _ = self.getstrippoint(minlink)
                      if rev == len(self):
                          return
                      # first truncate the files on disk
                      data_end = self.start(rev)
                      if not self._inline:
                          transaction.add(self._datafile, data_end)
                          end = rev * self.index.entry_size
                      else:
                          # inline: index entries and data share the index file
                          end = data_end + (rev * self.index.entry_size)
                      if self._sidedatafile:
                          sidedata_end = self.sidedata_cut_off(rev)
                          transaction.add(self._sidedatafile, sidedata_end)
                      transaction.add(self._indexfile, end)
                      if self._docket is not None:
                          # XXX we could leverage the docket while stripping. However it is
                          # not powerful enough at the time of this comment
                          self._docket.index_end = end
                          self._docket.data_end = data_end
                          # NOTE(review): ``sidedata_end`` is only bound when
                          # ``self._sidedatafile`` is truthy; presumably a docket always
                          # comes with a sidedata file - confirm.
                          self._docket.sidedata_end = sidedata_end
                          self._docket.write(transaction, stripping=True)
                      # then reset internal state in memory to forget those revisions
                      self._chaininfocache = util.lrucachedict(500)
                      self._inner.clear_cache()
                      # NOTE(review): slice deletion is handled by the index object itself;
                      # the exact meaning of the ``-1`` bound is defined there - confirm.
                      del self.index[rev:-1]
                 def checksize(self):
                     """Check size of index and data files
                     return a (dd, di) tuple.
                     - dd: extra bytes for the "data" file
                     - di: extra bytes for the "index" file
                     A healthy revlog will return (0, 0).
                     """
                     expected = 0
                     if len(self):
                         expected = max(0, self.end(len(self) - 1))
                     try:
                         with self._datafp() as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         dd = actual - expected
                     except FileNotFoundError:
                         dd = 0
                     try:
                         f = self.opener(self._indexfile)
                         f.seek(0, io.SEEK_END)
                         actual = f.tell()
                         f.close()
                         s = self.index.entry_size
                         i = max(0, actual // s)
                         di = actual - (i * s)
                         if self._inline:
                             databytes = 0
                             for r in self:
                                 databytes += max(0, self.length(r))
                             dd = 0
                             di = actual - len(self) * s - databytes
                     except FileNotFoundError:
                         di = 0
                     return (dd, di)
                 def files(self):
                     """return list of files that compose this revlog"""
                     res = [self._indexfile]
                     if self._docket_file is None:
                         if not self._inline:
                             res.append(self._datafile)
                     else:
                         res.append(self._docket_file)
                         res.extend(self._docket.old_index_filepaths(include_empty=False))
                         if self._docket.data_end:
                             res.append(self._datafile)
                         res.extend(self._docket.old_data_filepaths(include_empty=False))
                         if self._docket.sidedata_end:
                             res.append(self._sidedatafile)
                         res.extend(self._docket.old_sidedata_filepaths(include_empty=False))
                     return res
                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                     sidedata_helpers=None,
                     debug_info=None,
                 ):
                     if nodesorder not in (b'nodes', b'storage', b'linear', None):
                         raise error.ProgrammingError(
                             b'unhandled value for nodesorder: %s' % nodesorder
                         )
                     if nodesorder is None and not self.delta_config.general_delta:
                         nodesorder = b'storage'
                     if (
                         not self._storedeltachains
                         and deltamode != repository.CG_DELTAMODE_PREV
                     ):
                         deltamode = repository.CG_DELTAMODE_FULL
                     return storageutil.emitrevisions(
                         self,
                         nodes,
                         nodesorder,
                         revlogrevisiondelta,
                         deltaparentfn=self.deltaparent,
                         candeltafn=self._candelta,
                         rawsizefn=self.rawsize,
                         revdifffn=self.revdiff,
                         flagsfn=self.flags,
                         deltamode=deltamode,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         sidedata_helpers=sidedata_helpers,
                         debug_info=debug_info,
                     )
                 DELTAREUSEALWAYS = b'always'
                 DELTAREUSESAMEREVS = b'samerevs'
                 DELTAREUSENEVER = b'never'
                 DELTAREUSEFULLADD = b'fulladd'
                 DELTAREUSEALL = {b'always', b'samerevs', b'never', b'fulladd'}
                 def clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb=None,
                     deltareuse=DELTAREUSESAMEREVS,
                     forcedeltabothparents=None,
                     sidedata_helpers=None,
                 ):
                     """Copy this revlog to another, possibly with format changes.
                     The destination revlog will contain the same revisions and nodes.
                     However, it may not be bit-for-bit identical due to e.g. delta encoding
                     differences.
                     The ``deltareuse`` argument control how deltas from the existing revlog
                     are preserved in the destination revlog. The argument can have the
                     following values:
                     DELTAREUSEALWAYS
                        Deltas will always be reused (if possible), even if the destination
                        revlog would not select the same revisions for the delta. This is the
                        fastest mode of operation.
                     DELTAREUSESAMEREVS
                        Deltas will be reused if the destination revlog would pick the same
                        revisions for the delta. This mode strikes a balance between speed
                        and optimization.
                     DELTAREUSENEVER
                        Deltas will never be reused. This is the slowest mode of execution.
                        This mode can be used to recompute deltas (e.g. if the diff/delta
                        algorithm changes).
                     DELTAREUSEFULLADD
                        Revision will be re-added as if their were new content. This is
                        slower than DELTAREUSEALWAYS but allow more mechanism to kicks in.
                        eg: large file detection and handling.
                     Delta computation can be slow, so the choice of delta reuse policy can
                     significantly affect run time.
                     The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
                     two extremes. Deltas will be reused if they are appropriate. But if the
                     delta could choose a better revision, it will do so. This means if you
                     are converting a non-generaldelta revlog to a generaldelta revlog,
                     deltas will be recomputed if the delta's parent isn't a parent of the
                     revision.
                     In addition to the delta policy, the ``forcedeltabothparents``
                     argument controls whether to force compute deltas against both parents
                     for merges. By default, the current default is used.
                     See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
                     `sidedata_helpers`.
                     """
                     if deltareuse not in self.DELTAREUSEALL:
                         raise ValueError(
                             _(b'value for deltareuse invalid: %s') % deltareuse
                         )
                     if len(destrevlog):
                         raise ValueError(_(b'destination revlog is not empty'))
                     if getattr(self, 'filteredrevs', None):
                         raise ValueError(_(b'source revlog has filtered revisions'))
                     if getattr(destrevlog, 'filteredrevs', None):
                         raise ValueError(_(b'destination revlog has filtered revisions'))
                     # lazydelta and lazydeltabase controls whether to reuse a cached delta,
                     # if possible.
                     old_delta_config = destrevlog.delta_config
                     destrevlog.delta_config = destrevlog.delta_config.copy()
                     try:
                         if deltareuse == self.DELTAREUSEALWAYS:
                             destrevlog.delta_config.lazy_delta_base = True
                             destrevlog.delta_config.lazy_delta = True
                         elif deltareuse == self.DELTAREUSESAMEREVS:
                             destrevlog.delta_config.lazy_delta_base = False
                             destrevlog.delta_config.lazy_delta = True
                         elif deltareuse == self.DELTAREUSENEVER:
                             destrevlog.delta_config.lazy_delta_base = False
                             destrevlog.delta_config.lazy_delta = False
                         delta_both_parents = (
                             forcedeltabothparents or old_delta_config.delta_both_parents
                         )
                         destrevlog.delta_config.delta_both_parents = delta_both_parents
                         with self.reading(), destrevlog._writing(tr):
                             self._clone(
                                 tr,
                                 destrevlog,
                                 addrevisioncb,
                                 deltareuse,
                                 forcedeltabothparents,
                                 sidedata_helpers,
                             )
                     finally:
                         destrevlog.delta_config = old_delta_config
                  def _clone(
                      self,
                      tr,
                      destrevlog,
                      addrevisioncb,
                      deltareuse,
                      forcedeltabothparents,
                      sidedata_helpers,
                  ):
                      """perform the core duty of `revlog.clone` after parameter processing

                      Every revision of this revlog is added to ``destrevlog`` in order.
                      With ``DELTAREUSEFULLADD`` the full text goes through
                      ``destrevlog.addrevision()``; otherwise ``destrevlog._addrevision()``
                      receives either the stored delta (when the destination allows lazy
                      deltas and the revision is stored as a delta) or the raw text.
                      ``addrevisioncb``, when set, is called with this revlog, the
                      revision number and the node after each revision is added.
                      ``forcedeltabothparents`` is accepted but not read in this method.
                      """
                      write_debug = None
                      if self.delta_config.debug_delta:
                          write_debug = tr._report
                      # deltas are computed from the destination's point of view
                      deltacomputer = deltautil.deltacomputer(
                          destrevlog,
                          write_debug=write_debug,
                      )
                      index = self.index
                      for rev in self:
                          entry = index[rev]
                          # Some classes override linkrev to take filtered revs into
                          # account. Use raw entry from index.
                          flags = entry[0] & 0xFFFF
                          linkrev = entry[4]
                          # entry[5] / entry[6] are parent revisions; field 7 of their
                          # own entries is used as the parent node
                          p1 = index[entry[5]][7]
                          p2 = index[entry[6]][7]
                          node = entry[7]
                          # (Possibly) reuse the delta from the revlog if allowed and
                          # the revlog chunk is a delta.
                          cachedelta = None
                          rawtext = None
                          if deltareuse == self.DELTAREUSEFULLADD:
                              text = self._revisiondata(rev)
                              sidedata = self.sidedata(rev)
                              if sidedata_helpers is not None:
                                  (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                      self, sidedata_helpers, sidedata, rev
                                  )
                                  # NOTE(review): `&` binds tighter than `|`, so this is
                                  # flags | (new_flags[0] & ~new_flags[1]) - confirm that
                                  # this is the intended grouping.
                                  flags = flags | new_flags[0] & ~new_flags[1]
                              destrevlog.addrevision(
                                  text,
                                  tr,
                                  linkrev,
                                  p1,
                                  p2,
                                  cachedelta=cachedelta,
                                  node=node,
                                  flags=flags,
                                  deltacomputer=deltacomputer,
                                  sidedata=sidedata,
                              )
                          else:
                              if destrevlog.delta_config.lazy_delta:
                                  dp = self.deltaparent(rev)
                                  if dp != nullrev:
                                      # stored as a delta: hand over (base rev, delta bytes)
                                      cachedelta = (dp, bytes(self._inner._chunk(rev)))
                              sidedata = None
                              if not cachedelta:
                                  try:
                                      rawtext = self._revisiondata(rev)
                                  except error.CensoredNodeError as censored:
                                      # censored revisions are copied as their tombstone
                                      assert flags & REVIDX_ISCENSORED
                                      rawtext = censored.tombstone
                                  sidedata = self.sidedata(rev)
                              # sidedata is still None when a cached delta is reused
                              if sidedata is None:
                                  sidedata = self.sidedata(rev)
                              if sidedata_helpers is not None:
                                  (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                      self, sidedata_helpers, sidedata, rev
                                  )
                                  # NOTE(review): same precedence remark as in the
                                  # DELTAREUSEFULLADD branch of this loop.
                                  flags = flags | new_flags[0] & ~new_flags[1]
                              destrevlog._addrevision(
                                  node,
                                  rawtext,
                                  tr,
                                  linkrev,
                                  p1,
                                  p2,
                                  flags,
                                  cachedelta,
                                  deltacomputer=deltacomputer,
                                  sidedata=sidedata,
                              )
                          if addrevisioncb:
                              addrevisioncb(self, rev, node)
                 def censorrevision(self, tr, censornode, tombstone=b''):
                     if self._format_version == REVLOGV0:
                         raise error.RevlogError(
                             _(b'cannot censor with version %d revlogs')
                             % self._format_version
                         )
                     elif self._format_version == REVLOGV1:
                         rewrite.v1_censor(self, tr, censornode, tombstone)
                     else:
                         rewrite.v2_censor(self, tr, censornode, tombstone)
                  def verifyintegrity(self, state):
                      """Verifies the integrity of the revlog.
                      Yields ``revlogproblem`` instances describing problems that are
                      found.
                      ``state`` is a mapping with bytes keys. This method reads
                      ``b'expectedversion'``, ``b'erroroncensored'`` and, optionally,
                      ``b'skipflags'``; it (re)sets ``b'skipread'`` and
                      ``b'safe_renamed'`` to empty sets and records in ``b'skipread'``
                      the nodes whose content could not be checked.
                      """
                      # file-level check first: trailing bytes in data / index files
                      dd, di = self.checksize()
                      if dd:
                          yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
                      if di:
                          yield revlogproblem(error=_(b'index contains %d extra bytes') % di)
                      version = self._format_version
                      # The verifier tells us what version revlog we should be.
                      if version != state[b'expectedversion']:
                          yield revlogproblem(
                              warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                              % (self.display_id, version, state[b'expectedversion'])
                          )
                      state[b'skipread'] = set()
                      state[b'safe_renamed'] = set()
                      for rev in self:
                          node = self.node(rev)
                          # Verify contents. 4 cases to care about:
                          #
                          #   common: the most common case
                          #   rename: with a rename
                          #   meta: file content starts with b'\1\n', the metadata
                          #         header defined in filelog.py, but without a rename
                          #   ext: content stored externally
                          #
                          # More formally, their differences are shown below:
                          #
                          #                       | common | rename | meta  | ext
                          #  -------------------------------------------------------
                          #   flags()             | 0      | 0      | 0     | not 0
                          #   renamed()           | False  | True   | False | ?
                          #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
                          #
                          # "rawtext" means the raw text stored in revlog data, which
                          # could be retrieved by "rawdata(rev)". "text"
                          # mentioned below is "revision(rev)".
                          #
                          # There are 3 different lengths stored physically:
                          #  1. L1: rawsize, stored in revlog index
                          #  2. L2: len(rawtext), stored in revlog data
                          #  3. L3: len(text), stored in revlog data if flags==0, or
                          #     possibly somewhere else if flags!=0
                          #
                          # L1 should be equal to L2. L3 could be different from them.
                          # "text" may or may not affect commit hash depending on flag
                          # processors (see flagutil.addflagprocessor).
                          #
                          #              | common  | rename | meta  | ext
                          # -------------------------------------------------
                          #    rawsize() | L1      | L1     | L1    | L1
                          #       size() | L1      | L2-LM  | L1(*) | L1 (?)
                          # len(rawtext) | L2      | L2     | L2    | L2
                          #    len(text) | L2      | L2     | L2    | L3
                          #  len(read()) | L2      | L2-LM  | L2-LM | L3 (?)
                          #
                          # LM:  length of metadata, depending on rawtext
                          # (*): not ideal, see comment in filelog.size
                          # (?): could be "- len(meta)" if the resolved content has
                          #      rename metadata
                          #
                          # Checks needed to be done:
                          #  1. length check: L1 == L2, in all cases.
                          #  2. hash check: depending on flag processor, we may need to
                          #     use either "text" (external), or "rawtext" (in revlog).
                          try:
                              # keep only the skip flags this revision actually carries
                              skipflags = state.get(b'skipflags', 0)
                              if skipflags:
                                  skipflags &= self.flags(rev)
                              _verify_revision(self, skipflags, state, node)
                              # length check: index size (L1) vs. stored raw text (L2)
                              l1 = self.rawsize(rev)
                              l2 = len(self.rawdata(node))
                              if l1 != l2:
                                  yield revlogproblem(
                                      error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                                      node=node,
                                  )
                          except error.CensoredNodeError:
                              # censored data is only a problem when the caller says so
                              if state[b'erroroncensored']:
                                  yield revlogproblem(
                                      error=_(b'censored file data'), node=node
                                  )
                                  state[b'skipread'].add(node)
                          except Exception as e:
                              # any other failure is reported as a problem for this node
                              # and verification carries on with the next revision
                              yield revlogproblem(
                                  error=_(b'unpacking %s: %s')
                                  % (short(node), stringutil.forcebytestr(e)),
                                  node=node,
                              )
                              state[b'skipread'].add(node)
                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     """Collect storage statistics about this revlog.

                     Each keyword flag enables one entry of the returned dict:

                     - ``exclusivefiles``: list of ``(opener, path)`` pairs; the
                       index file, plus the data file when the revlog is not inline.
                     - ``sharedfiles``: always an empty list.
                     - ``revisionscount``: ``len(self)``.
                     - ``trackedsize``: sum of ``rawsize(rev)`` over all revisions.
                     - ``storedsize``: sum of the on-disk size of every path
                       returned by ``self.files()``.

                     With no flag set, an empty dict is returned.
                     """
                     info = {}
                     if exclusivefiles:
                         owned = [(self.opener, self._indexfile)]
                         if not self._inline:
                             owned.append((self.opener, self._datafile))
                         info[b'exclusivefiles'] = owned
                     if sharedfiles:
                         info[b'sharedfiles'] = []
                     if revisionscount:
                         info[b'revisionscount'] = len(self)
                     if trackedsize:
                         info[b'trackedsize'] = sum(self.rawsize(rev) for rev in self)
                     if storedsize:
                         on_disk = 0
                         for path in self.files():
                             on_disk += self.opener.stat(path).st_size
                         info[b'storedsize'] = on_disk
                     return info
                 def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
                     """Generate sidedata for a range of revisions and record it.

                     For every revision from ``startrev`` to ``endrev`` (both
                     inclusive), the sidedata helpers are run, the serialized
                     result is written through the sidedata file handle, and the
                     matching index entries are then rewritten in place.

                     Does nothing when the revlog has no sidedata support or when
                     both ``helpers[1]`` and ``helpers[2]`` are empty.

                     Raises ``error.Abort`` if a revision in the range already
                     has sidedata recorded (``entry[8]`` or ``entry[9]`` non-zero).
                     """
                     if not self.feature_config.has_side_data:
                         return
                     # revlog formats with sidedata support do not support inline
                     assert not self._inline
                     if not helpers[1] and not helpers[2]:
                         # Nothing to generate or remove
                         return
                     # one (offset, length, offset_flags, compression mode) tuple
                     # per processed revision, in revision order
                     new_entries = []
                     # append the new sidedata
                     with self._writing(transaction):
                         ifh, dfh, sdfh = self._inner._writinghandles
                         # NOTE(review): this seeks `dfh`, yet the starting offset
                         # below is read from `sdfh`; looks like `sdfh` may have
                         # been intended here -- confirm.
                         dfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                         current_offset = sdfh.tell()
                         for rev in range(startrev, endrev + 1):
                             entry = self.index[rev]
                             new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                                 store=self,
                                 sidedata_helpers=helpers,
                                 sidedata={},
                                 rev=rev,
                             )
                             serialized_sidedata = sidedatautil.serialize_sidedata(
                                 new_sidedata
                             )
                             # Pick the compression mode; the `has_side_data` test
                             # below repeats the guard at the top of the method.
                             sidedata_compression_mode = COMP_MODE_INLINE
                             if serialized_sidedata and self.feature_config.has_side_data:
                                 sidedata_compression_mode = COMP_MODE_PLAIN
                                 h, comp_sidedata = self._inner.compress(serialized_sidedata)
                                 # Only keep the compressed form when it is actually
                                 # smaller than the plain one.
                                 # NOTE(review): if `comp_sidedata` is `bytes`,
                                 # indexing it yields an int on Python 3, so the
                                 # comparison with b'\0' would always be true --
                                 # confirm the intent.
                                 if (
                                     h != b'u'
                                     and comp_sidedata[0] != b'\0'
                                     and len(comp_sidedata) < len(serialized_sidedata)
                                 ):
                                     assert not h
                                     if (
                                         comp_sidedata[0]
                                         == self._docket.default_compression_header
                                     ):
                                         sidedata_compression_mode = COMP_MODE_DEFAULT
                                         serialized_sidedata = comp_sidedata
                                     else:
                                         sidedata_compression_mode = COMP_MODE_INLINE
                                         serialized_sidedata = comp_sidedata
                             if entry[8] != 0 or entry[9] != 0:
                                 # rewriting entries that already have sidedata is not
                                 # supported yet, because it introduces garbage data in the
                                 # revlog.
                                 msg = b"rewriting existing sidedata is not supported yet"
                                 raise error.Abort(msg)
                             # Apply (potential) flags to add and to remove after running
                             # the sidedata helpers
                             # NOTE(review): `&` binds tighter than `|`, so this is
                             # `entry[0] | (flags[0] & ~flags[1])`; bits of flags[1]
                             # already set in entry[0] are therefore not cleared --
                             # confirm that this is intended.
                             new_offset_flags = entry[0] | flags[0] & ~flags[1]
                             entry_update = (
                                 current_offset,
                                 len(serialized_sidedata),
                                 new_offset_flags,
                                 sidedata_compression_mode,
                             )
                             # the sidedata computation might have moved the file cursors around
                             sdfh.seek(current_offset, os.SEEK_SET)
                             sdfh.write(serialized_sidedata)
                             new_entries.append(entry_update)
                             current_offset += len(serialized_sidedata)
                             self._docket.sidedata_end = sdfh.tell()
                         # rewrite the new index entries
                         ifh.seek(startrev * self.index.entry_size)
                         for i, e in enumerate(new_entries):
                             rev = startrev + i
                             self.index.replace_sidedata_info(rev, *e)
                             packed = self.index.entry_binary(rev)
                             # NOTE(review): `self._docket` is dereferenced
                             # unconditionally earlier in this method, so the
                             # `is None` branch looks unreachable here -- confirm.
                             if rev == 0 and self._docket is None:
                                 header = self._format_flags | self._format_version
                                 header = self.index.pack_header(header)
                                 packed = header + packed
                             ifh.write(packed)

             import unittest
             # picked from test-parse-index2, copied rather than imported
             # so that it stays stable even if test-parse-index2 changes or disappears.
             data_non_inlined = (
                 b'\x00\x00\x00\x01\x00\x00\x00\x00\x00\x01D\x19'
                 b'\x00\x07e\x12\x00\x00\x00\x00\x00\x00\x00\x00\xff\xff\xff\xff'
                 b'\xff\xff\xff\xff\xd1\xf4\xbb\xb0\xbe\xfc\x13\xbd\x8c\xd3\x9d'
                 b'\x0f\xcd\xd9;\x8c\x07\x8cJ/\x00\x00\x00\x00\x00\x00\x00\x00\x00'
                 b'\x00\x00\x00\x00\x00\x00\x01D\x19\x00\x00\x00\x00\x00\xdf\x00'
                 b'\x00\x01q\x00\x00\x00\x01\x00\x00\x00\x01\x00\x00\x00\x00\xff'
                 b'\xff\xff\xff\xc1\x12\xb9\x04\x96\xa4Z1t\x91\xdfsJ\x90\xf0\x9bh'
                 b'\x07l&\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00'
                 b'\x00\x01D\xf8\x00\x00\x00\x00\x01\x1b\x00\x00\x01\xb8\x00\x00'
                 b'\x00\x01\x00\x00\x00\x02\x00\x00\x00\x01\xff\xff\xff\xff\x02\n'
                 b'\x0e\xc6&\xa1\x92\xae6\x0b\x02i\xfe-\xe5\xbao\x05\xd1\xe7\x00'
                 b'\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x01F'
                 b'\x13\x00\x00\x00\x00\x01\xec\x00\x00\x03\x06\x00\x00\x00\x01'
                 b'\x00\x00\x00\x03\x00\x00\x00\x02\xff\xff\xff\xff\x12\xcb\xeby1'
                 b'\xb6\r\x98B\xcb\x07\xbd`\x8f\x92\xd9\xc4\x84\xbdK\x00\x00\x00'
                 b'\x00\x00\x00\x00\x00\x00\x00\x00\x00'
             )
             from ..revlogutils.constants import REVLOGV1
             try:
                 from ..cext import parsers as cparsers  # pytype: disable=import-error
             except ImportError:
                 cparsers = None
             try:
-                from ..rustext.revlog import MixedIndex  # pytype: disable=import-error
+                from ..rustext.revlog import (  # pytype: disable=import-error
+                    Index as RustIndex,
+                )
             except ImportError:
-                MixedIndex = None
+                RustIndex = None
             @unittest.skipIf(
                 cparsers is None,
                 'The C version of the "parsers" module is not available. It is needed for this test.',
             )
             class RevlogBasedTestBase(unittest.TestCase):
                 """Base class for tests that need an index parsed by the C parsers.

                 The whole class is skipped when the C ``parsers`` module could not
                 be imported.
                 """

                 def parseindex(self, data=None):
                     """Return the first item of ``cparsers.parse_index2(data, False)``.

                     ``data`` defaults to the module-level ``data_non_inlined`` sample.
                     """
                     raw = data_non_inlined if data is None else data
                     parsed = cparsers.parse_index2(raw, False)
                     return parsed[0]
             # Base class for tests that need an index built by the Rust extension;
             # the whole class is skipped when the Rust index could not be imported.
             @unittest.skipIf(
-                MixedIndex is None,
+                RustIndex is None,
                 'The Rust index is not available. It is needed for this test.',
             )
             class RustRevlogBasedTestBase(unittest.TestCase):
                 def parserustindex(self, data=None):
                     # `data` defaults to the module-level `data_non_inlined` sample
                     if data is None:
                         data = data_non_inlined
                     # not inheriting RevlogBasedTestBase to avoid having a
                     # `parseindex` method that would be shadowed by future
                     # subclasses; this duplication will soon be removed
-                    return MixedIndex(data, REVLOGV1)
+                    return RustIndex(data, REVLOGV1)

             // revlog.rs
             //
             // Copyright 2019-2020 Georges Racinet <georges.racinet@octobus.net>
             //
             // This software may be used and distributed according to the terms of the
             // GNU General Public License version 2 or any later version.
             use crate::{
                 conversion::{rev_pyiter_collect, rev_pyiter_collect_or_else},
                 utils::{node_from_py_bytes, node_from_py_object},
                 PyRevision,
             };
             use cpython::{
                 buffer::{Element, PyBuffer},
                 exc::{IndexError, ValueError},
                 ObjectProtocol, PyBool, PyBytes, PyClone, PyDict, PyErr, PyInt, PyList,
                 PyModule, PyObject, PyResult, PySet, PyString, PyTuple, Python,
                 PythonObject, ToPyObject, UnsafePyLeaked,
             };
             use hg::{
                 errors::HgError,
                 index::{
                     IndexHeader, Phase, RevisionDataParams, SnapshotsCache,
                     INDEX_ENTRY_SIZE,
                 },
                 nodemap::{Block, NodeMapError, NodeTree as CoreNodeTree},
                 revlog::{nodemap::NodeMap, Graph, NodePrefix, RevlogError, RevlogIndex},
                 BaseRevision, Node, Revision, UncheckedRevision, NULL_REVISION,
             };
             use std::{cell::RefCell, collections::HashMap};
             use vcsgraph::graph::Graph as VCSGraph;
             /// Thin wrapper around a `'static` reference to the hg-core index.
             ///
             /// Instances are produced by `py_rust_index_to_graph` from a leaked
             /// immutable borrow of the Python-owned index, and the wrapper
             /// implements `Graph`, `VCSGraph` and `RevlogIndex` by delegation.
             pub struct PySharedIndex {
                 /// The underlying hg-core index
                 pub(crate) inner: &'static hg::index::Index,
             }
             /// Return a Struct implementing the Graph trait
             ///
             /// `index` must be an instance of the Rust index Python class,
             /// otherwise the extraction error is returned. The result wraps a
             /// leaked immutable borrow of the shared index data.
             pub(crate) fn py_rust_index_to_graph(
                 py: Python,
                 index: PyObject,
             ) -> PyResult<UnsafePyLeaked<PySharedIndex>> {
-                let midx = index.extract::<MixedIndex>(py)?;
+                let midx = index.extract::<Index>(py)?;
                 let leaked = midx.index(py).leak_immutable();
                 // NOTE(review): `map` is unsafe here; presumably sound because
                 // the reference never escapes the `UnsafePyLeaked` wrapper --
                 // confirm against the rust-cpython sharedref contract.
                 Ok(unsafe { leaked.map(py, |idx| PySharedIndex { inner: idx }) })
             }
             impl Clone for PySharedIndex {
                 fn clone(&self) -> Self {
                     Self { inner: self.inner }
                 }
             }
             impl Graph for PySharedIndex {
                 /// Forward the parents lookup to the wrapped hg-core index.
                 fn parents(&self, rev: Revision) -> Result<[Revision; 2], hg::GraphError> {
                     self.inner.parents(rev)
                 }
             }
             impl VCSGraph for PySharedIndex {
                 /// Expose the hg-core parents lookup through the `vcsgraph`
                 /// trait, converting both the parents pair and the error into
                 /// their `vcsgraph` counterparts.
                 fn parents(
                     &self,
                     rev: BaseRevision,
                 ) -> Result<vcsgraph::graph::Parents, vcsgraph::graph::GraphReadError>
                 {
                     // FIXME This trait should be reworked to decide between Revision
                     // and UncheckedRevision, get better errors names, etc.
                     let looked_up = Graph::parents(self, Revision(rev));
                     looked_up
                         .map(|[p1, p2]| vcsgraph::graph::Parents([p1.0, p2.0]))
                         .map_err(|hg::GraphError::ParentOutOfRange(bad)| {
                             vcsgraph::graph::GraphReadError::KeyedInvalidKey(bad.0)
                         })
                 }
             }
             impl RevlogIndex for PySharedIndex {
                 /// Length as reported by the wrapped index.
                 fn len(&self) -> usize {
                     self.inner.len()
                 }
                 /// Node of `rev` as reported by the wrapped index, if any.
                 fn node(&self, rev: Revision) -> Option<&Node> {
                     self.inner.node(rev)
                 }
             }
-            py_class!(pub class MixedIndex |py| {
+            py_class!(pub class Index |py| {
                 @shared data index: hg::index::Index;
                 data nt: RefCell<Option<CoreNodeTree>>;
                 data docket: RefCell<Option<PyObject>>;
                 // Holds a reference to the mmap'ed persistent nodemap data
                 data nodemap_mmap: RefCell<Option<PyBuffer>>;
                 // Holds a reference to the mmap'ed persistent index data
                 data index_mmap: RefCell<Option<PyBuffer>>;
                 def __new__(
                     _cls,
                     data: PyObject,
                     default_header: u32,
-                ) -> PyResult<MixedIndex> {
+                ) -> PyResult<Self> {
                     // Python-level constructor: delegates to the inherent
                     // `Self::new`, passing both arguments through unchanged.
                     Self::new(py, data, default_header)
                 }
                 /// Compatibility layer used for Python consumers needing access to the C index
                 ///
                 /// Only use case so far is `scmutil.shortesthexnodeidprefix`,
                 /// that may need to build a custom `nodetree`, based on a specified revset.
                 /// With a Rust implementation of the nodemap, we will be able to get rid of
                 /// this, by exposing our own standalone nodemap class,
                 /// ready to accept `Index`.
             /*    def get_cindex(&self) -> PyResult<PyObject> {
                     Ok(self.cindex(py).borrow().inner().clone_ref(py))
                 }
             */
                 // Index API involving nodemap, as defined in mercurial/pure/parsers.py
                 /// Look up the revision of a binary node through the nodemap.
                 ///
                 /// Yields `None` when the node is not found; lookup failures are
                 /// converted by `nodemap_error` (a bare `error.RevlogError` in
                 /// case of ambiguity, same as the C version does).
                 def get_rev(&self, node: PyBytes) -> PyResult<Option<PyRevision>> {
                     let nodetree_guard = self.get_nodetree(py)?.borrow();
                     let nodetree = nodetree_guard.as_ref().unwrap();
                     let index_guard = self.index(py).borrow();
                     let wanted = node_from_py_bytes(py, &node)?;
                     let lookup = nodetree.find_bin(&*index_guard, wanted.into());
                     match lookup {
                         Ok(found) => Ok(found.map(Into::into)),
                         Err(e) => Err(nodemap_error(py, e)),
                     }
                 }
                 /// Strict variant of `get_rev()`: a missing node is reported as
                 /// a bare `error.RevlogError` instead of `None`.
                 ///
                 /// No need to repeat `node` in the exception, `mercurial/revlog.py`
                 /// will catch and rewrap with it
                 def rev(&self, node: PyBytes) -> PyResult<PyRevision> {
                     match self.get_rev(py, node)? {
                         Some(found) => Ok(found),
                         None => Err(revlog_error(py)),
                     }
                 }
                 /// return True if the node exists in the index
                 ///
                 /// Errors raised by `get_rev()` are propagated unchanged.
                 def has_node(&self, node: PyBytes) -> PyResult<bool> {
                     // TODO OPTIM we could avoid a needless conversion here,
                     // to do when scaffolding for pure Rust switch is removed,
                     // as `get_rev()` currently does the necessary assertions
                     let found = self.get_rev(py, node)?;
                     Ok(found.is_some())
                 }
                 /// find length of shortest hex nodeid of a binary ID
                 ///
                 /// A nodemap failure is converted by `nodemap_error`; when the
                 /// nodemap reports no length at all, `revlog_error` is raised.
                 def shortest(&self, node: PyBytes) -> PyResult<usize> {
                     let nodetree_guard = self.get_nodetree(py)?.borrow();
                     let nodetree = nodetree_guard.as_ref().unwrap();
                     let index_guard = self.index(py).borrow();
                     let target = node_from_py_bytes(py, &node)?;
                     let prefix_len = nodetree
                         .unique_prefix_len_node(&*index_guard, &target)
                         .map_err(|e| nodemap_error(py, e))?;
                     prefix_len.ok_or_else(|| revlog_error(py))
                 }
                 // Resolve a hexadecimal node prefix to the full binary node.
                 //
                 // Returns `None` when nothing matches, raises `ValueError` when
                 // the argument is not a valid hex node or prefix, and converts
                 // nodemap failures through `nodemap_error`.
                 def partialmatch(&self, node: PyObject) -> PyResult<Option<PyBytes>> {
                     let opt = self.get_nodetree(py)?.borrow();
                     let nt = opt.as_ref().unwrap();
                     let idx = &*self.index(py).borrow();
                     // With the "python3-sys" feature the argument is read as a
                     // Python `str`, otherwise as bytes decoded lossily as UTF-8.
                     let node_as_string = if cfg!(feature = "python3-sys") {
                         node.cast_as::<PyString>(py)?.to_string(py)?.to_string()
                     }
                     else {
                         let node = node.extract::<PyBytes>(py)?;
                         String::from_utf8_lossy(node.data(py)).to_string()
                     };
                     let prefix = NodePrefix::from_hex(&node_as_string)
                         .map_err(|_| PyErr::new::<ValueError, _>(
                             py, format!("Invalid node or prefix '{}'", node_as_string))
                         )?;
                     nt.find_bin(idx, prefix)
                         // TODO make an inner API returning the node directly
                         .map(|opt| opt.map(
                             |rev| PyBytes::new(py, idx.node(rev).unwrap().as_bytes())))
                         .map_err(|e| nodemap_error(py, e))
                 }
                 /// append an index entry
                 ///
                 /// `tup` must hold at least 8 items (`IndexError` otherwise);
                 /// item 7 is read as the node. The entry is appended to the
                 /// index first, then registered in the nodemap under the
                 /// revision number equal to the previous index length.
                 def append(&self, tup: PyTuple) -> PyResult<PyObject> {
                     if tup.len(py) < 8 {
                         // this is better than the panic promised by tup.get_item()
                         return Err(
                             PyErr::new::<IndexError, _>(py, "tuple index out of range"))
                     }
                     let node_bytes = tup.get_item(py, 7).extract(py)?;
                     let node = node_from_py_object(py, &node_bytes)?;
                     let rev = self.len(py)? as BaseRevision;
                     // This is ok since we will just add the revision to the index
                     let rev = Revision(rev);
                     // NOTE(review): a failing index append panics through
                     // `unwrap()` instead of raising a Python exception --
                     // confirm this is acceptable.
                     self.index(py)
                         .borrow_mut()
                         .append(py_tuple_to_revision_data_params(py, tup)?)
                         .unwrap();
                     let idx = &*self.index(py).borrow();
                     self.get_nodetree(py)?.borrow_mut().as_mut().unwrap()
                         .insert(idx, &node, rev)
                         .map_err(|e| nodemap_error(py, e))?;
                     Ok(py.None())
                 }
                 def __delitem__(&self, key: PyObject) -> PyResult<()> {
                     // __delitem__ is both for `del idx[r]` and `del idx[r1:r2]`
                     // Only the start of the range is used: the key is read
                     // either as a revision number or through its `start`
                     // attribute.
                     let start = if let Ok(rev) = key.extract(py) {
                         UncheckedRevision(rev)
                     } else {
                         let start = key.getattr(py, "start")?;
                         UncheckedRevision(start.extract(py)?)
                     };
                     let start = self.index(py)
                         .borrow()
                         .check_revision(start)
                         .ok_or_else(|| {
                             nodemap_error(py, NodeMapError::RevisionNotInIndex(start))
                         })?;
                     // NOTE(review): a failing removal panics through `unwrap()`
                     // rather than raising a Python exception -- confirm.
                     self.index(py).borrow_mut().remove(start).unwrap();
                     // The nodemap is invalidated entirely and refilled from the
                     // index after the removal.
                     let mut opt = self.get_nodetree(py)?.borrow_mut();
                     let nt = opt.as_mut().unwrap();
                     nt.invalidate_all();
                     self.fill_nodemap(py, nt)?;
                     Ok(())
                 }
                 //
                 // Index methods previously reforwarded to C index (tp_methods)
                 // Same ordering as in revlog.c
                 //
                 /// return the gca set of the given revs
                 ///
                 /// Positional arguments are forwarded as-is to `inner_ancestors`;
                 /// keyword arguments are accepted but ignored.
                 def ancestors(&self, *args, **_kw) -> PyResult<PyObject> {
                     let rust_res = self.inner_ancestors(py, args)?;
                     Ok(rust_res)
                 }
                 /// return the heads of the common ancestors of the given revs
                 ///
                 /// Positional arguments are forwarded as-is to
                 /// `inner_commonancestorsheads`; keyword arguments are accepted
                 /// but ignored.
                 def commonancestorsheads(&self, *args, **_kw) -> PyResult<PyObject> {
                     let rust_res = self.inner_commonancestorsheads(py, args)?;
                     Ok(rust_res)
                 }
                 /// Clear the index caches and inner py_class data.
                 /// It is Python's responsibility to call `update_nodemap_data` again.
                 ///
                 /// Drops the nodetree, the docket and the nodemap mmap reference,
                 /// then clears the caches of the hg-core index. The `index_mmap`
                 /// field is left untouched.
                 def clearcaches(&self) -> PyResult<PyObject> {
                     self.nt(py).borrow_mut().take();
                     self.docket(py).borrow_mut().take();
                     self.nodemap_mmap(py).borrow_mut().take();
                     self.index(py).borrow().clear_caches();
                     Ok(py.None())
                 }
                 /// return the raw binary string representing a revision
                 ///
                 /// The revision is the first positional argument. When it does
                 /// not pass `check_revision`, or the index has no binary entry
                 /// for it, the error built by `rev_not_in_index` is raised.
                 def entry_binary(&self, *args, **_kw) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let unchecked = UncheckedRevision(args.get_item(py, 0).extract(py)?);
                     let raw = match index.check_revision(unchecked) {
                         Some(checked) => index.entry_binary(checked),
                         None => None,
                     };
                     match raw {
                         Some(bytes) => Ok(PyBytes::new(py, bytes).into_object()),
                         None => Err(rev_not_in_index(py, unchecked)),
                     }
                 }
                 /// return a binary packed version of the header
                 ///
                 /// The header value is the first positional argument; the packed
                 /// form is returned as a Python bytes object.
                 def pack_header(&self, *args, **_kw) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let header = args.get_item(py, 0).extract(py)?;
                     let packed = index.pack_header(header);
                     Ok(PyBytes::new(py, &packed).into_object())
                 }
                 /// compute phases
                 ///
                 /// The first positional argument must be a dict (the phase
                 /// roots); it is handed to `inner_computephasesmapsets`, whose
                 /// result is returned unchanged.
                 def computephasesmapsets(&self, *args, **_kw) -> PyResult<PyObject> {
                     let py_roots = args.get_item(py, 0).extract::<PyDict>(py)?;
                     let rust_res = self.inner_computephasesmapsets(py, py_roots)?;
                     Ok(rust_res)
                 }
                 /// reachableroots
                 ///
                 /// Takes four positional arguments, forwarded in order to
                 /// `inner_reachableroots2`: the first is read as a revision
                 /// number, the second and third are passed as Python objects,
                 /// and the fourth is extracted to the type that helper expects.
                 def reachableroots2(&self, *args, **_kw) -> PyResult<PyObject> {
                     let rust_res = self.inner_reachableroots2(
                         py,
                         UncheckedRevision(args.get_item(py, 0).extract(py)?),
                         args.get_item(py, 1),
                         args.get_item(py, 2),
                         args.get_item(py, 3).extract(py)?,
                     )?;
                     Ok(rust_res)
                 }
                 /// get head revisions
                 ///
                 /// Returns whatever `inner_headrevs` produces, unchanged.
                 def headrevs(&self) -> PyResult<PyObject> {
                     let rust_res = self.inner_headrevs(py)?;
                     Ok(rust_res)
                 }
                 /// get filtered head revisions
                 ///
                 /// The first positional argument (the filter) is passed by
                 /// reference to `inner_headrevsfiltered`; keyword arguments are
                 /// accepted but ignored.
                 def headrevsfiltered(&self, *args, **_kw) -> PyResult<PyObject> {
                     let rust_res = self.inner_headrevsfiltered(py, &args.get_item(py, 0))?;
                     Ok(rust_res)
                 }
                 /// True if the object is a snapshot
                 ///
                 /// The revision is the first positional argument. An error from
                 /// the index is raised as a Python `ValueError` carrying the
                 /// error's message.
                 def issnapshot(&self, *args, **_kw) -> PyResult<bool> {
                     let index = self.index(py).borrow();
                     let rev = UncheckedRevision(args.get_item(py, 0).extract(py)?);
                     match index.is_snapshot(rev) {
                         Ok(flag) => Ok(flag),
                         Err(e) => Err(
                             PyErr::new::<cpython::exc::ValueError, _>(py, e.to_string())
                         ),
                     }
                 }
                 /// Gather snapshot data in a cache dict
                 ///
                 /// Positional arguments: the cache dict, the start revision and
                 /// the end revision. Results are recorded by inserting into the
                 /// given dict, and `None` is returned. Any failure of the
                 /// underlying search is raised as a bare `error.RevlogError`.
                 def findsnapshots(&self, *args, **_kw) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     // this method operates by setting new values in the cache
                     // passed by the caller
                     let cache: PyDict = args.get_item(py, 0).extract(py)?;
                     let start_rev = UncheckedRevision(args.get_item(py, 1).extract(py)?);
                     let end_rev = UncheckedRevision(args.get_item(py, 2).extract(py)?);
                     let mut cache_wrapper = PySnapshotsCache{ py, dict: cache };
                     index.find_snapshots(
                         start_rev,
                         end_rev,
                         &mut cache_wrapper,
                     ).map_err(|_| revlog_error(py))?;
                     Ok(py.None())
                 }
                 /// determine revisions with deltas to reconstruct fulltext
                 ///
                 /// Positional arguments: the revision, an optional stop
                 /// revision, and an optional integer read as the
                 /// "general delta" switch (non-zero meaning true). Returns a
                 /// `(chain, stopped)` tuple, the chain being a list of revision
                 /// numbers.
                 def deltachain(&self, *args, **_kw) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let rev = args.get_item(py, 0).extract::<BaseRevision>(py)?.into();
                     let stop_rev =
                         args.get_item(py, 1).extract::<Option<BaseRevision>>(py)?;
                     // Both revisions must pass `check_revision`, otherwise a
                     // "revision not in index" nodemap error is raised.
                     let rev = index.check_revision(rev).ok_or_else(|| {
                         nodemap_error(py, NodeMapError::RevisionNotInIndex(rev))
                     })?;
                     let stop_rev = if let Some(stop_rev) = stop_rev {
                         let stop_rev = UncheckedRevision(stop_rev);
                         Some(index.check_revision(stop_rev).ok_or_else(|| {
                             nodemap_error(py, NodeMapError::RevisionNotInIndex(stop_rev))
                         })?)
                     } else {None};
                     let using_general_delta = args.get_item(py, 2)
                         .extract::<Option<u32>>(py)?
                         .map(|i| i != 0);
                     // Failures of the chain computation surface as `ValueError`.
                     let (chain, stopped) = index.delta_chain(
                         rev, stop_rev, using_general_delta
                     ).map_err(|e| {
                         PyErr::new::<cpython::exc::ValueError, _>(py, e.to_string())
                     })?;
                     // Unwrap the revisions to plain integers for Python.
                     let chain: Vec<_> = chain.into_iter().map(|r| r.0).collect();
                     Ok(
                         PyTuple::new(
                             py,
                             &[
                                 chain.into_py_object(py).into_object(),
                                 stopped.into_py_object(py).into_object()
                             ]
                         ).into_object()
                     )
                 }
                 /// slice planned chunk read to reach a density threshold
                 ///
                 /// Takes three positional arguments, forwarded in order to
                 /// `inner_slicechunktodensity`: the first as a Python object, the
                 /// other two extracted to the types that helper expects.
                 def slicechunktodensity(&self, *args, **_kw) -> PyResult<PyObject> {
                     let rust_res = self.inner_slicechunktodensity(
                         py,
                         args.get_item(py, 0),
                         args.get_item(py, 1).extract(py)?,
                         args.get_item(py, 2).extract(py)?
                     )?;
                     Ok(rust_res)
                 }
                 // index_sequence_methods and index_mapping_methods.
                 //
                 // Since we call back through the high level Python API,
                 // there's no point making a distinction between index_get
                 // and index_getitem.
                 // gracinet 2023: this above is no longer true for the pure Rust impl
                 def __len__(&self) -> PyResult<usize> {
                     // Python's `len(index)`: delegates to the inherent `len`.
                     self.len(py)
                 }
                 def __getitem__(&self, key: PyObject) -> PyResult<PyObject> {
                     // Python's `index[key]`: a new reference to the key is
                     // handed to `inner_getitem`, whose result is returned as-is.
                     let rust_res = self.inner_getitem(py, key.clone_ref(py))?;
                     Ok(rust_res)
                 }
                 def __contains__(&self, item: PyObject) -> PyResult<bool> {
                     // ObjectProtocol does not seem to provide contains(), so
                     // this is an equivalent implementation of the index_contains()
                     // defined in revlog.c
                     //
                     // Integers are tested against the range -1..len; anything
                     // else must be bytes and is looked up as a node.
                     let rev = match item.extract::<i32>(py) {
                         Ok(rev) => rev,
                         Err(_) => {
                             let node: PyBytes = item.extract(py)?;
                             return self.has_node(py, node);
                         }
                     };
                     if rev < -1 {
                         return Ok(false);
                     }
                     Ok(rev < self.len(py)? as BaseRevision)
                 }
                 // Python entry point returning bytes; the work is done by
                 // `inner_nodemap_data_all`.
                 def nodemap_data_all(&self) -> PyResult<PyBytes> {
                     self.inner_nodemap_data_all(py)
                 }
                 // Python entry point; the work is done by
                 // `inner_nodemap_data_incremental`.
                 def nodemap_data_incremental(&self) -> PyResult<PyObject> {
                     self.inner_nodemap_data_incremental(py)
                 }
                 // Python entry point taking the docket and the nodemap data;
                 // both are passed unchanged to `inner_update_nodemap_data`.
                 def update_nodemap_data(
                     &self,
                     docket: PyObject,
                     nm_data: PyObject
                 ) -> PyResult<PyObject> {
                     self.inner_update_nodemap_data(py, docket, nm_data)
                 }
                 @property
                 def entry_size(&self) -> PyResult<PyInt> {
                     let rust_res: PyInt = INDEX_ENTRY_SIZE.to_py_object(py);
                     Ok(rust_res)
                 }
                 @property
                 def rust_ext_compat(&self) -> PyResult<PyInt> {
                     // will be entirely removed once the Rust index is fully in place,
                     // yet useful to implement in Rust to detangle things when removing
                     // `self.cindex`
                     let rust_res: PyInt = 1.to_py_object(py);
                     Ok(rust_res)
                 }
                 @property
                 def is_rust(&self) -> PyResult<PyBool> {
                     Ok(false.to_py_object(py))
                 }
             });
             /// Borrow the bytes of a (potentially) mmap'ed Python buffer.
             ///
             /// Returns the Python buffer object together with a Rust slice pointing
             /// into it. The buffer is handed back so that the caller can hold on to
             /// it: dropping it while the slice is still in use would leave the slice
             /// dangling once the memory is freed from Python's side.
             ///
             /// A Python `ValueError` is returned when the buffer items are not
             /// `u8`-sized, when the buffer is not C-contiguous, or when its format is
             /// not compatible with `u8`.
             ///
             /// # Safety
             ///
             /// The caller must make sure that the buffer is kept around for at least as
             /// long as the slice.
             #[deny(unsafe_op_in_unsafe_fn)]
             unsafe fn mmap_keeparound(
                 py: Python,
                 data: PyObject,
             ) -> PyResult<(
                 PyBuffer,
                 Box<dyn std::ops::Deref<Target = [u8]> + Send + Sync + 'static>,
             )> {
                 let buf = PyBuffer::get(py, &data)?;
                 let is_plain_bytes = buf.item_size() == std::mem::size_of::<u8>()
                     && buf.is_c_contiguous()
                     && u8::is_compatible_format(buf.format());
                 if !is_plain_bytes {
                     return Err(PyErr::new::<ValueError, _>(
                         py,
                         "Nodemap data buffer has an invalid memory representation"
                             .to_string(),
                     ));
                 }
                 // Build a slice from the mmap'ed buffer data, whose layout has just
                 // been validated
                 let start = buf.buf_ptr() as *const u8;
                 let len = buf.item_count();
                 let bytes = unsafe { std::slice::from_raw_parts(start, len) };
                 Ok((buf, Box::new(bytes)))
             }
             fn py_tuple_to_revision_data_params(
                 py: Python,
                 tuple: PyTuple,
             ) -> PyResult<RevisionDataParams> {
                 if tuple.len(py) < 8 {
                     // this is better than the panic promised by tup.get_item()
                     return Err(PyErr::new::<IndexError, _>(
                         py,
                         "tuple index out of range",
                     ));
                 }
                 let offset_or_flags: u64 = tuple.get_item(py, 0).extract(py)?;
                 let node_id = tuple
                     .get_item(py, 7)
                     .extract::<PyBytes>(py)?
                     .data(py)
                     .try_into()
                     .unwrap();
                 let flags = (offset_or_flags & 0xFFFF) as u16;
                 let data_offset = offset_or_flags >> 16;
                 Ok(RevisionDataParams {
                     flags,
                     data_offset,
                     data_compressed_length: tuple.get_item(py, 1).extract(py)?,
                     data_uncompressed_length: tuple.get_item(py, 2).extract(py)?,
                     data_delta_base: tuple.get_item(py, 3).extract(py)?,
                     link_rev: tuple.get_item(py, 4).extract(py)?,
                     parent_rev_1: tuple.get_item(py, 5).extract(py)?,
                     parent_rev_2: tuple.get_item(py, 6).extract(py)?,
                     node_id,
                     ..Default::default()
                 })
             }
             /// Convert `params` into the 13-item Python tuple describing an index
             /// entry.
             ///
             /// The first item is `params.data_offset` as is: `params.flags` is not
             /// read by this function.
             fn revision_data_params_to_py_tuple(
                 py: Python,
                 params: RevisionDataParams,
             ) -> PyTuple {
                 let offset = params.data_offset.into_py_object(py).into_object();
                 let compressed_length =
                     params.data_compressed_length.into_py_object(py).into_object();
                 let uncompressed_length = params
                     .data_uncompressed_length
                     .into_py_object(py)
                     .into_object();
                 let delta_base =
                     params.data_delta_base.into_py_object(py).into_object();
                 let link_rev = params.link_rev.into_py_object(py).into_object();
                 let p1 = params.parent_rev_1.into_py_object(py).into_object();
                 let p2 = params.parent_rev_2.into_py_object(py).into_object();
                 let node = PyBytes::new(py, &params.node_id)
                     .into_py_object(py)
                     .into_object();
                 let sidedata_offset =
                     params._sidedata_offset.into_py_object(py).into_object();
                 let sidedata_compressed_length = params
                     ._sidedata_compressed_length
                     .into_py_object(py)
                     .into_object();
                 let data_compression_mode =
                     params.data_compression_mode.into_py_object(py).into_object();
                 let sidedata_compression_mode = params
                     ._sidedata_compression_mode
                     .into_py_object(py)
                     .into_object();
                 let rank = params._rank.into_py_object(py).into_object();

                 let items = [
                     offset,
                     compressed_length,
                     uncompressed_length,
                     delta_base,
                     link_rev,
                     p1,
                     p2,
                     node,
                     sidedata_offset,
                     sidedata_compressed_length,
                     data_compression_mode,
                     sidedata_compression_mode,
                     rank,
                 ];
                 PyTuple::new(py, &items)
             }
             /// Snapshots cache backed by a Python `dict`.
             ///
             /// Its `SnapshotsCache` implementation stores, for each key revision, a
             /// Python `set` of revision numbers in `dict`.
             struct PySnapshotsCache<'p> {
                 // Python token used for every operation on `dict`
                 py: Python<'p>,
                 // the Python dict being filled
                 dict: PyDict,
             }
             impl<'p> SnapshotsCache for PySnapshotsCache<'p> {
                 fn insert_for(
                     &mut self,
                     rev: BaseRevision,
                     value: BaseRevision,
                 ) -> Result<(), RevlogError> {
                     let pyvalue = value.into_py_object(self.py).into_object();
                     match self.dict.get_item(self.py, rev) {
                         Some(obj) => obj
                             .extract::<PySet>(self.py)
                             .and_then(|set| set.add(self.py, pyvalue)),
                         None => PySet::new(self.py, vec![pyvalue])
                             .and_then(|set| self.dict.set_item(self.py, rev, set)),
                     }
                     .map_err(|_| {
                         RevlogError::Other(HgError::unsupported(
                             "Error in Python caches handling",
                         ))
                     })
                 }
             }
-            impl MixedIndex {
+            impl Index {
                 /// Create the Python-visible index from `data`, an object exposing
                 /// the buffer protocol, and the revlog `header`.
                 ///
                 /// The header is parsed from its big-endian byte representation; a
                 /// header that fails to parse is a panic, not a Python exception.
                 /// An error from `hg::index::Index::new` is raised as a `RevlogError`
                 /// carrying the error message.
-                fn new(py: Python, data: PyObject, header: u32) -> PyResult<MixedIndex> {
+                fn new(py: Python, data: PyObject, header: u32) -> PyResult<Self> {
                     // Safety: we keep the buffer around inside the class as `index_mmap`
                     let (buf, bytes) = unsafe { mmap_keeparound(py, data)? };
                     Self::create_instance(
                         py,
                         hg::index::Index::new(
                             bytes,
                             IndexHeader::parse(&header.to_be_bytes())
                                 .expect("default header is broken")
                                 .unwrap(),
                         )
                         .map_err(|e| {
                             revlog_error_with_msg(py, e.to_string().as_bytes())
                         })?,
                         // NOTE(review): presumably the node tree, docket and nodemap
                         // mmap slots, all starting empty -- confirm against the
                         // `data` declarations of the class
                         RefCell::new(None),
                         RefCell::new(None),
                         RefCell::new(None),
                         // the Python buffer backing `bytes`, kept alive with the
                         // instance
                         RefCell::new(Some(buf)),
                     )
                 }
                 /// Number of revisions in the underlying Rust index.
                 fn len(&self, py: Python) -> PyResult<usize> {
                     Ok(self.index(py).borrow().len())
                 }
                 /// Insert every revision of the index into `nt`.
                 ///
                 /// This is scaffolding at this point, but it could also become
                 /// a way to start a persistent nodemap or perform a
                 /// vacuum / repack operation
                 fn fill_nodemap(
                     &self,
                     py: Python,
                     nt: &mut CoreNodeTree,
                 ) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let revision_count = index.len();
                     for raw_rev in 0..revision_count {
                         let rev = Revision(raw_rev as BaseRevision);
                         // in this case node() won't ever return None
                         let node = index.node(rev).unwrap();
                         nt.insert(&*index, node, rev)
                             .map_err(|e| nodemap_error(py, e))?;
                     }
                     Ok(py.None())
                 }
                 /// Return the cell holding the node tree, building the tree from the
                 /// whole index first if the cell is currently empty.
                 fn get_nodetree<'a>(
                     &'a self,
                     py: Python<'a>,
                 ) -> PyResult<&'a RefCell<Option<CoreNodeTree>>> {
                     let cell = self.nt(py);
                     let missing = cell.borrow().is_none();
                     if missing {
                         // start from an empty readonly part and add all revisions
                         let mut fresh =
                             CoreNodeTree::load_bytes(Box::<Vec<_>>::default(), 0);
                         self.fill_nodemap(py, &mut fresh)?;
                         *cell.borrow_mut() = Some(fresh);
                     }
                     Ok(cell)
                 }
                 /// Returns the full nodemap bytes to be written as-is to disk
                 ///
                 /// The node tree is taken out of its cell in the process.
                 fn inner_nodemap_data_all(&self, py: Python) -> PyResult<PyBytes> {
                     let nodemap = self.get_nodetree(py)?.borrow_mut().take().unwrap();
                     let (readonly, added) = nodemap.into_readonly_and_added_bytes();
                     let bytes = if readonly.is_empty() {
                         added
                     } else {
                         // If there's anything readonly, we need to build the data
                         // again from scratch
                         let mut rebuilt =
                             CoreNodeTree::load_bytes(Box::<Vec<_>>::default(), 0);
                         self.fill_nodemap(py, &mut rebuilt)?;
                         let (readonly, added) = rebuilt.into_readonly_and_added_bytes();
                         assert_eq!(readonly.len(), 0);
                         added
                     };
                     Ok(PyBytes::new(py, &bytes))
                 }
                 /// Returns the last saved docket along with the size of any changed data
                 /// (in number of blocks), and said data as bytes.
                 ///
                 /// Returns Python `None` if no docket has been saved. Otherwise the
                 /// node tree is taken out of its cell in the process.
                 fn inner_nodemap_data_incremental(
                     &self,
                     py: Python,
                 ) -> PyResult<PyObject> {
                     let docket_slot = self.docket(py).borrow();
                     let saved_docket = match &*docket_slot {
                         None => return Ok(py.None()),
                         Some(d) => d,
                     };
                     let tree = self.get_nodetree(py)?.borrow_mut().take().unwrap();
                     let changed =
                         tree.masked_readonly_blocks() * std::mem::size_of::<Block>();
                     let (_, added) = tree.into_readonly_and_added_bytes();
                     let result = (saved_docket, changed, PyBytes::new(py, &added));
                     Ok(result.to_py_object(py).into_object())
                 }
                 /// Update the nodemap from the new (mmaped) data.
                 /// The docket is kept as a reference for later incremental calls.
                 ///
                 /// The node tree is loaded from `nm_data`, then completed with the
                 /// revisions of the index that come after the `tip_rev` attribute of
                 /// `docket`. Returns Python `None` on success.
                 ///
                 /// An error is returned if `tip_rev` cannot be read as a revision
                 /// number, if it is not a revision of the index, or if an insertion
                 /// in the node tree fails.
                 fn inner_update_nodemap_data(
                     &self,
                     py: Python,
                     docket: PyObject,
                     nm_data: PyObject,
                 ) -> PyResult<PyObject> {
                     // Safety: we keep the buffer around inside the class as `nodemap_mmap`
                     let (buf, bytes) = unsafe { mmap_keeparound(py, nm_data)? };
                     let len = buf.item_count();
                     self.nodemap_mmap(py).borrow_mut().replace(buf);
                     let mut nt = CoreNodeTree::load_bytes(bytes, len);
                     let data_tip = docket
                         .getattr(py, "tip_rev")?
                         .extract::<BaseRevision>(py)?
                         .into();
                     // NOTE(review): the buffer and the docket are stored before
                     // `data_tip` is validated, so they stay replaced even if one of
                     // the checks below fails -- confirm this is intended
                     self.docket(py).borrow_mut().replace(docket.clone_ref(py));
                     let idx = self.index(py).borrow();
                     let data_tip = idx.check_revision(data_tip).ok_or_else(|| {
                         nodemap_error(py, NodeMapError::RevisionNotInIndex(data_tip))
                     })?;
                     let current_tip = idx.len();
                     // catch up with the revisions that are in the index but come
                     // after the tip recorded in the docket
                     for r in (data_tip.0 + 1)..current_tip as BaseRevision {
                         let rev = Revision(r);
                         // in this case node() won't ever return None
                         nt.insert(&*idx, idx.node(rev).unwrap(), rev)
                             .map_err(|e| nodemap_error(py, e))?
                     }
                     *self.nt(py).borrow_mut() = Some(nt);
                     Ok(py.None())
                 }
                 /// Implementation of `__getitem__`.
                 ///
                 /// An integer key returns the index entry of that revision as a
                 /// tuple (the null revision gets the default entry), or raises
                 /// `IndexError` if the index has no such revision. Any other key is
                 /// extracted as bytes and looked up as a node, returning its revision
                 /// number or `None`.
                 fn inner_getitem(&self, py: Python, key: PyObject) -> PyResult<PyObject> {
                     let idx = self.index(py).borrow();
                     let rev_num = match key.extract::<BaseRevision>(py) {
                         Ok(n) => n,
                         Err(_) => {
                             // not an integer: treat the key as a node
                             let node = key.extract::<PyBytes>(py)?;
                             return Ok(match self.get_rev(py, node)? {
                                 Some(py_rev) => {
                                     py_rev.into_py_object(py).into_object()
                                 }
                                 None => py.None(),
                             });
                         }
                     };
                     let entry_params = if rev_num == NULL_REVISION.0 {
                         RevisionDataParams::default()
                     } else {
                         idx.entry_as_params(UncheckedRevision(rev_num))
                             .ok_or_else(|| {
                                 PyErr::new::<IndexError, _>(
                                     py,
                                     "revlog index out of range",
                                 )
                             })?
                     };
                     Ok(revision_data_params_to_py_tuple(py, entry_params).into_object())
                 }
                 /// Return the head revisions of the index as a Python list.
                 ///
                 /// A graph error is raised as a `ValueError`.
                 fn inner_headrevs(&self, py: Python) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let heads = index.head_revs().map_err(|e| graph_error(py, e))?;
                     let mut py_heads: Vec<PyObject> = Vec::new();
                     for rev in heads.iter() {
                         py_heads
                             .push(PyRevision::from(*rev).into_py_object(py).into_object());
                     }
                     Ok(PyList::new(py, &py_heads).into_object())
                 }
                 /// Return, as a Python list, the head revisions of the index once the
                 /// revisions of the `filtered_revs` iterable are left out.
                 ///
                 /// The index is mutably borrowed for the duration of the call. A graph
                 /// error is raised as a `ValueError`.
                 fn inner_headrevsfiltered(
                     &self,
                     py: Python,
                     filtered_revs: &PyObject,
                 ) -> PyResult<PyObject> {
                     let mut index = self.index(py).borrow_mut();
                     let filtered = rev_pyiter_collect(py, filtered_revs, &*index)?;
                     let heads = index
                         .head_revs_filtered(&filtered)
                         .map_err(|e| graph_error(py, e))?;
                     let mut py_heads: Vec<PyObject> = Vec::new();
                     for rev in heads.iter() {
                         py_heads
                             .push(PyRevision::from(*rev).into_py_object(py).into_object());
                     }
                     Ok(PyList::new(py, &py_heads).into_object())
                 }
                 /// Return, as a Python list, the result of the index `ancestors`
                 /// computation for the revisions given in `py_revs`.
                 ///
                 /// A graph error is raised as a `ValueError`.
                 fn inner_ancestors(
                     &self,
                     py: Python,
                     py_revs: &PyTuple,
                 ) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let revs: Vec<_> =
                         rev_pyiter_collect(py, py_revs.as_object(), &*index)?;
                     let ancestors =
                         index.ancestors(&revs).map_err(|e| graph_error(py, e))?;
                     let mut py_ancestors: Vec<PyObject> = Vec::new();
                     for rev in ancestors.iter() {
                         py_ancestors
                             .push(PyRevision::from(*rev).into_py_object(py).into_object());
                     }
                     Ok(PyList::new(py, &py_ancestors).into_object())
                 }
                 /// Return, as a Python list, the result of the index
                 /// `common_ancestor_heads` computation for the revisions given in
                 /// `py_revs`.
                 ///
                 /// A graph error is raised as a `ValueError`.
                 fn inner_commonancestorsheads(
                     &self,
                     py: Python,
                     py_revs: &PyTuple,
                 ) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let revs: Vec<_> =
                         rev_pyiter_collect(py, py_revs.as_object(), &*index)?;
                     let heads = index
                         .common_ancestor_heads(&revs)
                         .map_err(|e| graph_error(py, e))?;
                     let mut py_heads: Vec<PyObject> = Vec::new();
                     for rev in heads.iter() {
                         py_heads
                             .push(PyRevision::from(*rev).into_py_object(py).into_object());
                     }
                     Ok(PyList::new(py, &py_heads).into_object())
                 }
                 /// Compute the phase sets from `py_roots`, a Python dict whose items
                 /// are `(phase number, iterable of nodes as bytes)`.
                 ///
                 /// Returns a Python tuple `(len, phase_maps)` where `len` is the
                 /// first value given by the index `compute_phases_map_sets` and
                 /// `phase_maps` is a dict mapping a phase number to a set of
                 /// revision numbers.
                 ///
                 /// A `RevlogError` is raised for a node that is not found in the node
                 /// tree and for a phase number that `Phase` rejects.
                 fn inner_computephasesmapsets(
                     &self,
                     py: Python,
                     py_roots: PyDict,
                 ) -> PyResult<PyObject> {
                     let index = &*self.index(py).borrow();
                     // the node tree is built on demand by `get_nodetree`, hence the
                     // unwrap below
                     let opt = self.get_nodetree(py)?.borrow();
                     let nt = opt.as_ref().unwrap();
                     let roots: Result<HashMap<Phase, Vec<Revision>>, PyErr> = py_roots
                         .items_list(py)
                         .iter(py)
                         .map(|r| {
                             let phase = r.get_item(py, 0)?;
                             let nodes = r.get_item(py, 1)?;
                             // Transform the nodes from Python to revs here since we
                             // have access to the nodemap
                             let revs: Result<_, _> = nodes
                                 .iter(py)?
                                 .map(|node| match node?.extract::<PyBytes>(py) {
                                     Ok(py_bytes) => {
                                         let node = node_from_py_bytes(py, &py_bytes)?;
                                         nt.find_bin(index, node.into())
                                             .map_err(|e| nodemap_error(py, e))?
                                             .ok_or_else(|| revlog_error(py))
                                     }
                                     Err(e) => Err(e),
                                 })
                                 .collect();
                             let phase = Phase::try_from(phase.extract::<usize>(py)?)
                                 .map_err(|_| revlog_error(py));
                             // a phase error takes precedence over a node error
                             Ok((phase?, revs?))
                         })
                         .collect();
                     let (len, phase_maps) = index
                         .compute_phases_map_sets(roots?)
                         .map_err(|e| graph_error(py, e))?;
                     // Ugly hack, but temporary
                     // Position in `phase_maps` -> phase number used as Python dict key
                     const IDX_TO_PHASE_NUM: [usize; 4] = [1, 2, 32, 96];
                     let py_phase_maps = PyDict::new(py);
                     for (idx, roots) in phase_maps.iter().enumerate() {
                         let phase_num = IDX_TO_PHASE_NUM[idx].into_py_object(py);
                         // OPTIM too bad we have to collect here. At least, we could
                         // reuse the same Vec and allocate it with capacity at
                         // max(len(phase_maps)
                         let roots_vec: Vec<PyInt> = roots
                             .iter()
                             .map(|r| PyRevision::from(*r).into_py_object(py))
                             .collect();
                         py_phase_maps.set_item(
                             py,
                             phase_num,
                             PySet::new(py, roots_vec)?,
                         )?;
                     }
                     Ok(PyTuple::new(
                         py,
                         &[
                             len.into_py_object(py).into_object(),
                             py_phase_maps.into_object(),
                         ],
                     )
                     .into_object())
                 }
                 /// Slice `revs` with the index `slice_chunk_to_density` and convert
                 /// the resulting chunks to Python lists of revision numbers.
                 ///
                 /// The chunks are returned in a Python tuple when there is exactly
                 /// one of them, and in a Python list otherwise.
                 fn inner_slicechunktodensity(
                     &self,
                     py: Python,
                     revs: PyObject,
                     target_density: f64,
                     min_gap_size: usize,
                 ) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let revs: Vec<_> = rev_pyiter_collect(py, &revs, &*index)?;
                     let chunks =
                         index.slice_chunk_to_density(&revs, target_density, min_gap_size);
                     let mut py_chunks: Vec<PyObject> = Vec::with_capacity(chunks.len());
                     for chunk in chunks {
                         let py_revs: Vec<PyObject> = chunk
                             .into_iter()
                             .map(|rev| {
                                 PyRevision::from(rev).into_py_object(py).into_object()
                             })
                             .collect();
                         py_chunks.push(PyList::new(py, &py_revs).into_object());
                     }
                     // This is just to do the same as C, not sure why it does this
                     Ok(match py_chunks.len() {
                         1 => PyTuple::new(py, &py_chunks).into_object(),
                         _ => PyList::new(py, &py_chunks).into_object(),
                     })
                 }
                 /// Return, as a Python list, the result of the index
                 /// `reachable_roots` computation for the given `heads` and `roots`.
                 ///
                 /// `heads` are checked against the index and an `IndexError` is raised
                 /// for one that is out of range, whereas `roots` are passed on
                 /// unchecked. A graph error is raised as a `ValueError`.
                 fn inner_reachableroots2(
                     &self,
                     py: Python,
                     min_root: UncheckedRevision,
                     heads: PyObject,
                     roots: PyObject,
                     include_path: bool,
                 ) -> PyResult<PyObject> {
                     let index = self.index(py).borrow();
                     let heads = rev_pyiter_collect_or_else(py, &heads, &*index, |_rev| {
                         PyErr::new::<IndexError, _>(py, "head out of range")
                     })?;
                     let roots: PyResult<_> = roots
                         .iter(py)?
                         .map(|item| -> PyResult<UncheckedRevision> {
                             let py_rev = item?.extract::<PyRevision>(py)?;
                             Ok(UncheckedRevision(py_rev.0))
                         })
                         .collect();
                     let reachable = index
                         .reachable_roots(min_root, heads, roots?, include_path)
                         .map_err(|e| graph_error(py, e))?;
                     let mut py_revs: Vec<PyObject> = Vec::new();
                     for rev in reachable.iter() {
                         py_revs
                             .push(PyRevision::from(*rev).into_py_object(py).into_object());
                     }
                     Ok(PyList::new(py, &py_revs).into_object())
                 }
             }
             // Python class wrapping a `CoreNodeTree` together with a leaked
             // reference to the index that its methods resolve revisions against.
             py_class!(pub class NodeTree |py| {
                 // the node tree itself
                 data nt: RefCell<CoreNodeTree>;
                 // leaked shared reference to the index, borrowed anew by each method
                 data index: RefCell<UnsafePyLeaked<PySharedIndex>>;
                 // Start with an empty tree bound to the given Rust index object
                 def __new__(_cls, index: PyObject) -> PyResult<NodeTree> {
                     let index = py_rust_index_to_graph(py, index)?;
                     let nt = CoreNodeTree::default();  // in-RAM, fully mutable
                     Self::create_instance(py, RefCell::new(nt), RefCell::new(index))
                 }
                 /// Tell whether the NodeTree is still valid
                 ///
                 /// In case of mutation of the index, the given results are not
                 /// guaranteed to be correct, and in fact, the methods borrowing
                 /// the inner index would fail because of `PySharedRef` poisoning
                 /// (generation-based guard), same as iterating on a `dict` that has
                 /// been meanwhile mutated.
                 def is_invalidated(&self) -> PyResult<bool> {
                     let leaked = self.index(py).borrow();
                     let result = unsafe { leaked.try_borrow(py) };
                     // two cases for result to be an error:
                     // - the index has previously been mutably borrowed
                     // - there is currently a mutable borrow
                     // in both cases previous results related to the index can no
                     // longer be considered valid.
                     Ok(result.is_err())
                 }
                 // Insert the node of revision `rev` in the tree. A `ValueError` is
                 // raised if `rev` is not in the index or is the null revision.
                 def insert(&self, rev: PyRevision) -> PyResult<PyObject> {
                     let leaked = self.index(py).borrow();
                     let index = &*unsafe { leaked.try_borrow(py)? };
                     let rev = UncheckedRevision(rev.0);
                     let rev = index
                         .check_revision(rev)
                         .ok_or_else(|| rev_not_in_index(py, rev))?;
                     if rev == NULL_REVISION {
                         return Err(rev_not_in_index(py, rev.into()))
                     }
                     // `rev` has been checked against the index just above
                     let entry = index.inner.get_entry(rev).unwrap();
                     let mut nt = self.nt(py).borrow_mut();
                     nt.insert(index, entry.hash(), rev).map_err(|e| nodemap_error(py, e))?;
                     Ok(py.None())
                 }
                 /// Lookup by node hex prefix in the NodeTree, returning revision number.
                 ///
                 /// This is not part of the classical NodeTree API, but is good enough
                 /// for unit testing, as in `test-rust-revlog.py`.
                 def prefix_rev_lookup(
                     &self,
                     node_prefix: PyBytes
                 ) -> PyResult<Option<PyRevision>> {
                     let prefix = NodePrefix::from_hex(node_prefix.data(py))
                         .map_err(|_| PyErr::new::<ValueError, _>(
                             py,
                             format!("Invalid node or prefix {:?}",
                                     node_prefix.as_object()))
                         )?;
                     let nt = self.nt(py).borrow();
                     let leaked = self.index(py).borrow();
                     let index = &*unsafe { leaked.try_borrow(py)? };
                     Ok(nt.find_bin(index, prefix)
                            .map_err(|e| nodemap_error(py, e))?
                            .map(|r| r.into())
                     )
                 }
                 // Return the value given by `unique_prefix_len_node` for `node`.
                 // A `RevlogError` is raised when that lookup yields nothing.
                 def shortest(&self, node: PyBytes) -> PyResult<usize> {
                     let nt = self.nt(py).borrow();
                     let leaked = self.index(py).borrow();
                     let idx = &*unsafe { leaked.try_borrow(py)? };
                     match nt.unique_prefix_len_node(idx, &node_from_py_bytes(py, &node)?)
                     {
                         Ok(Some(l)) => Ok(l),
                         Ok(None) => Err(revlog_error(py)),
                         Err(e) => Err(nodemap_error(py, e)),
                     }
                 }
             });
             /// Build a `mercurial.error.RevlogError` exception with `None` as its
             /// sole argument.
             ///
             /// If the module cannot be imported, if `RevlogError` cannot be found in
             /// it, or if the exception cannot be instantiated, the Python error raised
             /// by that step is returned instead.
             fn revlog_error(py: Python) -> PyErr {
                 let instance = py
                     .import("mercurial.error")
                     .and_then(|m| m.get(py, "RevlogError"))
                     .and_then(|cls| cls.call(py, (py.None(),), None));
                 match instance {
                     Ok(exc) => PyErr::from_instance(py, exc),
                     // Surface the actual failure: discarding it would hand Python
                     // `None` to `from_instance` and hide what went wrong.
                     Err(e) => e,
                 }
             }
             /// Build a `mercurial.error.RevlogError` exception with `msg`, passed as
             /// Python bytes, as its sole argument.
             ///
             /// If the module cannot be imported, if `RevlogError` cannot be found in
             /// it, or if the exception cannot be instantiated, the Python error raised
             /// by that step is returned instead.
             fn revlog_error_with_msg(py: Python, msg: &[u8]) -> PyErr {
                 let instance = py
                     .import("mercurial.error")
                     .and_then(|m| m.get(py, "RevlogError"))
                     .and_then(|cls| cls.call(py, (PyBytes::new(py, msg),), None));
                 match instance {
                     Ok(exc) => PyErr::from_instance(py, exc),
                     // Surface the actual failure: discarding it would hand Python
                     // `None` to `from_instance` and hide what went wrong.
                     Err(e) => e,
                 }
             }
             /// Convert a `hg::GraphError` into the Python exception to raise.
             ///
             /// The error value itself is not inspected.
             fn graph_error(py: Python, _err: hg::GraphError) -> PyErr {
                 // ParentOutOfRange is currently the only alternative
                 // in `hg::GraphError`. The C index always raises this simple ValueError.
                 let message = "parent out of range";
                 PyErr::new::<ValueError, _>(py, message)
             }
             /// `ValueError` for a revision that the nodemap knows about but the
             /// revlog index does not.
             fn nodemap_rev_not_in_index(py: Python, rev: UncheckedRevision) -> PyErr {
                 let message = format!(
                     "Inconsistency: Revision {} found in nodemap \
                      is not in revlog index",
                     rev
                 );
                 PyErr::new::<ValueError, _>(py, message)
             }
             /// `ValueError` for a revision number that is not in the revlog index.
             fn rev_not_in_index(py: Python, rev: UncheckedRevision) -> PyErr {
                 let message = format!("revlog index out of range: {}", rev);
                 PyErr::new::<ValueError, _>(py, message)
             }
             /// Standard treatment of NodeMapError
             ///
             /// Multiple results become a `RevlogError`, a revision missing from
             /// the index becomes a `ValueError`.
             fn nodemap_error(py: Python, err: NodeMapError) -> PyErr {
                 match err {
                     NodeMapError::RevisionNotInIndex(rev) => {
                         nodemap_rev_not_in_index(py, rev)
                     }
                     NodeMapError::MultipleResults => revlog_error(py),
                 }
             }
             /// Create the module, with __package__ given from parent
             ///
             /// The module is named `<package>.revlog`, gets the index and `NodeTree`
             /// classes added to it, and is registered in `sys.modules` under its
             /// dotted name before being returned.
             pub fn init_module(py: Python, package: &str) -> PyResult<PyModule> {
                 let dotted_name = &format!("{}.revlog", package);
                 let m = PyModule::new(py, dotted_name)?;
                 m.add(py, "__package__", package)?;
                 m.add(py, "__doc__", "RevLog - Rust implementations")?;
-                m.add_class::<MixedIndex>(py)?;
+                m.add_class::<Index>(py)?;
                 m.add_class::<NodeTree>(py)?;
                 // register the new module in `sys.modules` under its dotted name
                 let sys = PyModule::import(py, "sys")?;
                 let sys_modules: PyDict = sys.get(py, "modules")?.extract(py)?;
                 sys_modules.set_item(py, dotted_name, &m)?;
                 Ok(m)
             }

             import struct
             import unittest
             from mercurial.node import hex
             # rustext is optional: when it cannot be imported, `rustext` is set to
             # None, which the skipIf decorators below use to skip the test classes
             try:
                 from mercurial import rustext
                 rustext.__name__  # trigger immediate actual import
             except ImportError:
                 rustext = None
             else:
                 from mercurial.rustext import revlog
                 # this would fail already without appropriate ancestor.__package__
                 from mercurial.rustext.ancestor import LazyAncestors
             from mercurial.testing import revlog as revlogtesting
             # first 4 bytes of the non-inlined test data, decoded as a big-endian
             # unsigned 32-bit integer; passed as second argument when building the
             # Rust index in the tests below
             header = struct.unpack(">I", revlogtesting.data_non_inlined[:4])[0]
             @unittest.skipIf(
                 rustext is None,
                 "rustext module revlog relies on is not available",
             )
             class RustRevlogIndexTest(revlogtesting.RevlogBasedTestBase):
                 # Compare the index class exposed by the Rust `revlog` module, built
                 # from the non-inlined test data, with the index returned by
                 # `self.parseindex()`.
                 def test_heads(self):
                     # both indexes must report the same head revisions
                     idx = self.parseindex()
-                    rustidx = revlog.MixedIndex(revlogtesting.data_non_inlined, header)
+                    rustidx = revlog.Index(revlogtesting.data_non_inlined, header)
                     self.assertEqual(rustidx.headrevs(), idx.headrevs())
                 def test_len(self):
                     # both indexes must have the same length
                     idx = self.parseindex()
-                    rustidx = revlog.MixedIndex(revlogtesting.data_non_inlined, header)
+                    rustidx = revlog.Index(revlogtesting.data_non_inlined, header)
                     self.assertEqual(len(rustidx), len(idx))
                 def test_ancestors(self):
                     # the Rust index must be usable as the index of LazyAncestors
-                    rustidx = revlog.MixedIndex(revlogtesting.data_non_inlined, header)
+                    rustidx = revlog.Index(revlogtesting.data_non_inlined, header)
                     # NOTE(review): arguments are presumably
                     # (index, initrevs, stoprev, inclusive) - confirm against
                     # rustext.ancestor
                     lazy = LazyAncestors(rustidx, [3], 0, True)
                     # we have two more references to the index:
                     # - in its inner iterator for __contains__ and __bool__
                     # - in the LazyAncestors instance itself (to spawn new iterators)
                     self.assertTrue(2 in lazy)
                     self.assertTrue(bool(lazy))
                     self.assertEqual(list(lazy), [3, 2, 1, 0])
                     # a second time to validate that we spawn new iterators
                     self.assertEqual(list(lazy), [3, 2, 1, 0])
                     # let's check bool for an empty one
                     self.assertFalse(LazyAncestors(rustidx, [0], 0, False))
             @unittest.skipIf(
                 rustext is None,
                 "rustext module revlog relies on is not available",
             )
             class RustRevlogNodeTreeClassTest(revlogtesting.RustRevlogBasedTestBase):
                 # Exercise a `revlog.NodeTree` created on top of the Rust index
                 # returned by `self.parserustindex()`.
                 def test_standalone_nodetree(self):
                     index = self.parserustindex()
                     tree = revlog.NodeTree(index)
                     for rev in range(4):
                         tree.insert(rev)

                     binary_ids = [entry[7] for entry in index]
                     hex_ids = [hex(binary) for binary in binary_ids]

                     # the full hexadecimal id and its first 5 digits must both
                     # resolve to the revision number
                     for rev, hex_id in enumerate(hex_ids):
                         self.assertEqual(tree.prefix_rev_lookup(hex_id), rev)
                         self.assertEqual(tree.prefix_rev_lookup(hex_id[:5]), rev)

                     # the standard data set has 4 revisions whose Node IDs all start
                     # with a different nybble, so `tree.shortest()` should answer 1,
                     # except when that leading nybble is 0 (ambiguity with NULL_NODE)
                     zero_digit = ord('0')
                     for rev, binary in enumerate(binary_ids):
                         hex_id = hex_ids[rev]
                         length = tree.shortest(binary)
                         if hex_id[0] == zero_digit:
                             wanted = 2
                         else:
                             wanted = 1
                         self.assertEqual(length, wanted)
                         self.assertEqual(
                             tree.prefix_rev_lookup(hex_id[:length]), rev
                         )

                     # test invalidation (generation poisoning) detection
                     del index[3]
                     self.assertTrue(tree.is_invalidated())
             # when executed as a script, hand this module's tests over to
             # silenttestrunner
             if __name__ == '__main__':
                 import silenttestrunner
                 silenttestrunner.main(__name__)