upstream/mercurial-mirror Commit - r53433:98dcbe75

1

# revlog.py - storage back-end for mercurial

1

# revlog.py - storage back-end for mercurial

2

# coding: utf8

2

# coding: utf8

3

#

3

#

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

"""Storage back-end for Mercurial.

9

"""Storage back-end for Mercurial.

10

11

This provides efficient delta storage with O(1) retrieve and append

11

This provides efficient delta storage with O(1) retrieve and append

12

and O(changes) merge between branches.

12

and O(changes) merge between branches.

13

"""

13

"""

14

15

from __future__ import annotations

15

from __future__ import annotations

16

17

import binascii

17

import binascii

18

import collections

18

import collections

19

import contextlib

19

import contextlib

20

import io

20

import io

21

import os

21

import os

22

import struct

22

import struct

23

import typing

23

import typing

24

import weakref

24

import weakref

25

import zlib

25

import zlib

26

27

from typing import (

27

from typing import (

28

Iterable,

28

Iterable,

29

Iterator,

29

Iterator,

30

Optional,

30

Optional,

31

Tuple,

31

Tuple,

32

)

32

)

33

34

# import stuff from node for others to import from revlog

34

# import stuff from node for others to import from revlog

35

from .node import (

35

from .node import (

36

bin,

36

bin,

37

hex,

37

hex,

38

nullrev,

38

nullrev,

39

sha1nodeconstants,

39

sha1nodeconstants,

40

short,

40

short,

41

wdirrev,

41

wdirrev,

42

)

42

)

43

from .i18n import _

43

from .i18n import _

44

from .revlogutils.constants import (

44

from .revlogutils.constants import (

45

ALL_KINDS,

45

ALL_KINDS,

46

CHANGELOGV2,

46

CHANGELOGV2,

47

COMP_MODE_DEFAULT,

47

COMP_MODE_DEFAULT,

48

COMP_MODE_INLINE,

48

COMP_MODE_INLINE,

49

COMP_MODE_PLAIN,

49

COMP_MODE_PLAIN,

50

DELTA_BASE_REUSE_NO,

50

DELTA_BASE_REUSE_NO,

51

DELTA_BASE_REUSE_TRY,

51

DELTA_BASE_REUSE_TRY,

52

ENTRY_RANK,

52

ENTRY_RANK,

53

FEATURES_BY_VERSION,

53

FEATURES_BY_VERSION,

54

FLAG_GENERALDELTA,

54

FLAG_GENERALDELTA,

55

FLAG_INLINE_DATA,

55

FLAG_INLINE_DATA,

56

INDEX_HEADER,

56

INDEX_HEADER,

57

KIND_CHANGELOG,

57

KIND_CHANGELOG,

58

KIND_FILELOG,

58

KIND_FILELOG,

59

RANK_UNKNOWN,

59

RANK_UNKNOWN,

60

REVLOGV0,

60

REVLOGV0,

61

REVLOGV1,

61

REVLOGV1,

62

REVLOGV1_FLAGS,

62

REVLOGV1_FLAGS,

63

REVLOGV2,

63

REVLOGV2,

64

REVLOGV2_FLAGS,

64

REVLOGV2_FLAGS,

65

REVLOG_DEFAULT_FLAGS,

65

REVLOG_DEFAULT_FLAGS,

66

REVLOG_DEFAULT_FORMAT,

66

REVLOG_DEFAULT_FORMAT,

67

REVLOG_DEFAULT_VERSION,

67

REVLOG_DEFAULT_VERSION,

68

SUPPORTED_FLAGS,

68

SUPPORTED_FLAGS,

69

)

69

)

70

from .revlogutils.flagutil import (

70

from .revlogutils.flagutil import (

71

REVIDX_DEFAULT_FLAGS,

71

REVIDX_DEFAULT_FLAGS,

72

REVIDX_ELLIPSIS,

72

REVIDX_ELLIPSIS,

73

REVIDX_EXTSTORED,

73

REVIDX_EXTSTORED,

74

REVIDX_FLAGS_ORDER,

74

REVIDX_FLAGS_ORDER,

75

REVIDX_HASCOPIESINFO,

75

REVIDX_HASCOPIESINFO,

76

REVIDX_ISCENSORED,

76

REVIDX_ISCENSORED,

77

REVIDX_RAWTEXT_CHANGING_FLAGS,

77

REVIDX_RAWTEXT_CHANGING_FLAGS,

78

)

78

)

79

from .thirdparty import attr

79

from .thirdparty import attr

80

81

# Force pytype to use the non-vendored package

81

# Force pytype to use the non-vendored package

82

if typing.TYPE_CHECKING:

82

if typing.TYPE_CHECKING:

83

# noinspection PyPackageRequirements

83

# noinspection PyPackageRequirements

84

import attr

84

import attr

85

from .pure.parsers import BaseIndexObject

85

from .pure.parsers import BaseIndexObject

86

87

from . import (

87

from . import (

88

ancestor,

88

ancestor,

89

dagop,

89

dagop,

90

error,

90

error,

91

mdiff,

91

mdiff,

92

policy,

92

policy,

93

pycompat,

93

pycompat,

94

revlogutils,

94

revlogutils,

95

templatefilters,

95

templatefilters,

96

util,

96

util,

97

vfs as vfsmod,

97

vfs as vfsmod,

98

)

98

)

99

from .interfaces import (

99

from .interfaces import (

100

repository,

100

repository,

101

)

101

)

102

from .revlogutils import (

102

from .revlogutils import (

103

deltas as deltautil,

103

deltas as deltautil,

104

docket as docketutil,

104

docket as docketutil,

105

flagutil,

105

flagutil,

106

nodemap as nodemaputil,

106

nodemap as nodemaputil,

107

randomaccessfile,

107

randomaccessfile,

108

revlogv0,

108

revlogv0,

109

rewrite,

109

rewrite,

110

sidedata as sidedatautil,

110

sidedata as sidedatautil,

111

)

111

)

112

from .utils import (

112

from .utils import (

113

storageutil,

113

storageutil,

114

stringutil,

114

stringutil,

115

)

115

)

116

117

# Bare references to all these names, to keep pyflakes from complaining.
# We need these names available in the module for extensions.

119

120

REVLOGV0

120

REVLOGV0

121

REVLOGV1

121

REVLOGV1

122

REVLOGV2

122

REVLOGV2

123

CHANGELOGV2

123

CHANGELOGV2

124

FLAG_INLINE_DATA

124

FLAG_INLINE_DATA

125

FLAG_GENERALDELTA

125

FLAG_GENERALDELTA

126

REVLOG_DEFAULT_FLAGS

126

REVLOG_DEFAULT_FLAGS

127

REVLOG_DEFAULT_FORMAT

127

REVLOG_DEFAULT_FORMAT

128

REVLOG_DEFAULT_VERSION

128

REVLOG_DEFAULT_VERSION

129

REVLOGV1_FLAGS

129

REVLOGV1_FLAGS

130

REVLOGV2_FLAGS

130

REVLOGV2_FLAGS

131

REVIDX_ISCENSORED

131

REVIDX_ISCENSORED

132

REVIDX_ELLIPSIS

132

REVIDX_ELLIPSIS

133

REVIDX_HASCOPIESINFO

133

REVIDX_HASCOPIESINFO

134

REVIDX_EXTSTORED

134

REVIDX_EXTSTORED

135

REVIDX_DEFAULT_FLAGS

135

REVIDX_DEFAULT_FLAGS

136

REVIDX_FLAGS_ORDER

136

REVIDX_FLAGS_ORDER

137

REVIDX_RAWTEXT_CHANGING_FLAGS

137

REVIDX_RAWTEXT_CHANGING_FLAGS

138

139

parsers = policy.importmod('parsers')

139

parsers = policy.importmod('parsers')

140

rustancestor = policy.importrust('ancestor')

140

rustancestor = policy.importrust('ancestor', pyo3=True)

141

rustdagop = policy.importrust('dagop', pyo3=True)

141

rustdagop = policy.importrust('dagop', pyo3=True)

142

rustrevlog = policy.importrust('revlog')

142

rustrevlog = policy.importrust('revlog')

143

144

# Aliased for performance.

144

# Aliased for performance.

145

_zlibdecompress = zlib.decompress

145

_zlibdecompress = zlib.decompress

146

147

# max size of inline data embedded into a revlog

147

# max size of inline data embedded into a revlog

148

_maxinline = 131072

148

_maxinline = 131072

149

150

151

# Flag processors for REVIDX_ELLIPSIS.

151

# Flag processors for REVIDX_ELLIPSIS.

152

def ellipsisreadprocessor(rl, text):
    """Read-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is not used.  ``text`` is handed back unchanged, paired with the
    constant ``False``.
    """
    result = (text, False)
    return result

154

155

156

def ellipsiswriteprocessor(rl, text):
    """Write-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is not used.  ``text`` is handed back unchanged, paired with the
    constant ``False``.
    """
    result = (text, False)
    return result

158

159

160

def ellipsisrawprocessor(rl, text):
    """Raw flag processor for REVIDX_ELLIPSIS.

    Both arguments are ignored; the answer is always ``False``.
    """
    answer = False
    return answer

162

163

164

# The three REVIDX_ELLIPSIS flag processors, bundled in
# (read, write, raw) order.
ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)

169

170

171

def _verify_revision(rl, skipflags, state, node):

171

def _verify_revision(rl, skipflags, state, node):

172

"""Verify the integrity of the given revlog ``node`` while providing a hook

172

"""Verify the integrity of the given revlog ``node`` while providing a hook

173

point for extensions to influence the operation."""

173

point for extensions to influence the operation."""

174

if skipflags:

174

if skipflags:

175

state[b'skipread'].add(node)

175

state[b'skipread'].add(node)

176

else:

176

else:

177

# Side-effect: read content and verify hash.

177

# Side-effect: read content and verify hash.

178

rl.revision(node)

178

rl.revision(node)

179

180

181

# True if a fast implementation for persistent-nodemap is available

181

# True if a fast implementation for persistent-nodemap is available

182

#

182

#

183

# We also consider we have a "fast" implementation in "pure" python because

183

# We also consider we have a "fast" implementation in "pure" python because

184

# people using pure don't really have performance consideration (and a

184

# people using pure don't really have performance consideration (and a

185

# wheelbarrow of other slowness source)

185

# wheelbarrow of other slowness source)

186

# Set when the Rust revlog module was imported, or when the loaded
# ``parsers`` module exposes ``BaseIndexObject``.
HAS_FAST_PERSISTENT_NODEMAP = (
    rustrevlog is not None or hasattr(parsers, 'BaseIndexObject')
)

189

190

191

@attr.s(slots=True)
class revlogrevisiondelta(repository.irevisiondelta):
    """Slotted attrs record deriving from ``repository.irevisiondelta``.

    Attributes are declared in constructor order; only ``linknode`` has a
    default (``None``).
    """

    # node identifiers (bytes)
    node = attr.ib(type=bytes)
    p1node = attr.ib(type=bytes)
    p2node = attr.ib(type=bytes)
    basenode = attr.ib(type=bytes)

    flags = attr.ib(type=int)

    # optional payload description; each of these may be None
    baserevisionsize = attr.ib(type=Optional[int])
    revision = attr.ib(type=Optional[bytes])
    delta = attr.ib(type=Optional[bytes])
    sidedata = attr.ib(type=Optional[bytes])

    protocol_flags = attr.ib(type=int)
    linknode = attr.ib(default=None, type=Optional[bytes])

204

205

206

@attr.s(frozen=True)
class revlogproblem(repository.iverifyproblem):
    """Frozen attrs record deriving from ``repository.iverifyproblem``.

    All three attributes are optional bytes and default to ``None``.
    """

    warning = attr.ib(type=Optional[bytes], default=None)
    error = attr.ib(type=Optional[bytes], default=None)
    node = attr.ib(type=Optional[bytes], default=None)

211

212

213

def parse_index_v1(data, inline):
    """Parse revlog index ``data`` through ``parsers.parse_index2``.

    ``inline`` is forwarded as is.  Returns the ``(index, cache)`` pair
    produced by the parser.
    """
    # delegate the actual parsing to the ``parsers`` implementation
    idx, chunk_cache = parsers.parse_index2(data, inline)
    return idx, chunk_cache

217

218

219

def parse_index_v2(data, inline):
    """Parse revlog index ``data`` in the ``REVLOGV2`` format.

    Same as the v1 parser call, but ``parsers.parse_index2`` is told to use
    ``format=REVLOGV2``.  Returns the ``(index, cache)`` pair it produced.
    """
    # delegate the actual parsing to the ``parsers`` implementation
    idx, chunk_cache = parsers.parse_index2(data, inline, format=REVLOGV2)
    return idx, chunk_cache

223

224

225

def parse_index_cl_v2(data, inline):
    """Parse revlog index ``data`` in the ``CHANGELOGV2`` format.

    ``parsers.parse_index2`` is called with ``format=CHANGELOGV2``.  Returns
    the ``(index, cache)`` pair it produced.
    """
    # delegate the actual parsing to the ``parsers`` implementation
    idx, chunk_cache = parsers.parse_index2(
        data, inline, format=CHANGELOGV2
    )
    return idx, chunk_cache

229

230

231

if not hasattr(parsers, 'parse_index_devel_nodemap'):
    # the loaded ``parsers`` module has no devel nodemap parser
    parse_index_v1_nodemap = None
else:

    def parse_index_v1_nodemap(data, inline):
        """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``.

        Returns the ``(index, cache)`` pair produced by that parser.
        """
        idx, chunk_cache = parsers.parse_index_devel_nodemap(data, inline)
        return idx, chunk_cache

239

240

241

def parse_index_v1_rust(data, inline, default_header):
    """Build a ``rustrevlog.Index`` from ``data``.

    Returns ``(index, cache)``.  ``cache`` is ``(0, data)`` when ``inline``
    is truthy and ``None`` otherwise.
    """
    if inline:
        cache = (0, data)
    else:
        cache = None
    return rustrevlog.Index(data, default_header), cache

244

245

246

# Corresponds to the uncompressed length field of indexformatng: a 4-byte
# signed integer, hence 2 gigs.
_maxentrysize = 2**31 - 1  # 0x7FFFFFFF

# Placeholders, in order: revlog name, expected byte count, offset and
# actual data size.
FILE_TOO_SHORT_MSG = _(
    b'cannot read from revlog %s;'
    b' expected %d bytes from offset %d, data size is %d'
)

# every ASCII hexadecimal digit, in both cases
hexdigits = b'0123456789abcdefABCDEF'

256

257

258

class _Config:

258

class _Config:

259

def copy(self):

259

def copy(self):

260

return self.__class__(**self.__dict__)

260

return self.__class__(**self.__dict__)

261

262

263

@attr.s()
class FeatureConfig(_Config):
    """Hold configuration values about the available revlog features"""

    # compression engine used by default
    compression_engine = attr.ib(default=b'zlib')
    # options for the compression engines
    compression_engine_options = attr.ib(default=attr.Factory(dict))

    # whether censor can be used on this revlog
    censorable = attr.ib(default=False)
    # whether this revlog uses the "side data" feature
    has_side_data = attr.ib(default=False)
    # the rank configuration might be removed once its computation has no
    # impact
    compute_rank = attr.ib(default=False)
    # Parent order is supposed to be semantically irrelevant, so parents are
    # normally re-sorted to make sure the first one is non-null whenever a
    # non-null parent exists at all.
    # filelog abuses the parent order as a flag marking some instances of
    # meta-encoded files, so it is allowed to disable this behavior.
    canonical_parent_order = attr.ib(default=False)
    # whether ellipsis commits can be used
    enable_ellipsis = attr.ib(default=False)

    def copy(self):
        """Return a copy that owns its own compression options.

        The base-class copy shares attribute values with ``self``; the
        options container is duplicated on top of that (through its own
        ``copy()`` method) so the two objects do not share it.
        """
        duplicate = super().copy()
        own_options = self.compression_engine_options.copy()
        duplicate.compression_engine_options = own_options
        return duplicate

291

292

293

@attr.s()
class DataConfig(_Config):
    """Hold configuration value about how the revlog data are read"""

    # whether to try opening the "pending" version of the revlog
    try_pending = attr.ib(default=False)
    # whether to try opening the "splitted" version of the revlog
    try_split = attr.ib(default=False)
    # When True, the index file should be opened with checkambig=True when
    # writing, to avoid file stat ambiguity.
    check_ambig = attr.ib(default=False)

    # If true, mmap is used instead of a plain read to deal with a large
    # index
    mmap_large_index = attr.ib(default=False)
    # how much data counts as "large"
    mmap_index_threshold = attr.ib(default=None)
    # How much data to read and cache into the raw revlog data cache.
    chunk_cache_size = attr.ib(default=65536)

    # The size of the uncompressed cache, relative to the largest revision
    # seen.
    uncompressed_cache_factor = attr.ib(default=None)

    # The number of chunks cached
    uncompressed_cache_count = attr.ib(default=None)

    # Allow sparse reading of the revlog data
    with_sparse_read = attr.ib(default=False)
    # minimal density of a sparse read chunk
    sr_density_threshold = attr.ib(default=0.5)
    # minimal size of the data skipped when performing a sparse read
    sr_min_gap_size = attr.ib(default=262144)

    # are deltas encoded against arbitrary bases?
    generaldelta = attr.ib(default=False)

327

328

329

@attr.s()
class DeltaConfig(_Config):
    """Hold configuration value about how new delta are computed

    Some attributes are duplicated from DataConfig to help having each object
    self contained.
    """

    # whether deltas can be encoded against arbitrary bases
    general_delta = attr.ib(default=False)
    # Allow sparse writing of the revlog data
    sparse_revlog = attr.ib(default=False)
    # maximum length of a delta chain
    max_chain_len = attr.ib(default=None)
    # Maximum distance between the start of a delta chain base and its end
    max_deltachain_span = attr.ib(default=-1)
    # When `upper_bound_comp` is not None, it is the expected maximal gain
    # from compression for the data content.
    upper_bound_comp = attr.ib(default=None)
    # whether a delta against both parents should be tried
    delta_both_parents = attr.ib(default=True)
    # Delta base candidate groups are tested by chunks of at most this size.
    candidate_group_chunk_size = attr.ib(default=0)
    # whether debug information about delta computation is displayed
    debug_delta = attr.ib(default=False)
    # trust incoming deltas (enabled by default)
    lazy_delta = attr.ib(default=True)
    # trust the base of incoming deltas (disabled by default)
    lazy_delta_base = attr.ib(default=False)

358

359

360

class _InnerRevlog:

360

class _InnerRevlog:

361

"""An inner layer of the revlog object

361

"""An inner layer of the revlog object

362

363

That layer exist to be able to delegate some operation to Rust, its

363

That layer exist to be able to delegate some operation to Rust, its

364

boundaries are arbitrary and based on what we can delegate to Rust.

364

boundaries are arbitrary and based on what we can delegate to Rust.

365

"""

365

"""

366

367

opener: vfsmod.vfs

367

opener: vfsmod.vfs

368

369

def __init__(
    self,
    opener: vfsmod.vfs,
    index,
    index_file,
    data_file,
    sidedata_file,
    inline,
    data_config,
    delta_config,
    feature_config,
    chunk_cache,
    default_compression_header,
):
    """Record the collaborators and set up the per-instance caches.

    ``opener``, ``index``, the three file names, ``inline`` and the three
    configuration objects are stored as attributes of the same name.
    ``chunk_cache`` is only handed to the random-access reader of the main
    segment file (the index file when ``inline`` is truthy, the data file
    otherwise); the sidedata reader is created without one.
    """
    self.opener = opener
    self.index: BaseIndexObject = index

    self.index_file = index_file
    self.data_file = data_file
    self.sidedata_file = sidedata_file
    self.inline = inline
    self.data_config = data_config
    self.delta_config = delta_config
    self.feature_config = feature_config

    # used during diverted write.
    self._orig_index_file = None

    self._default_compression_header = default_compression_header

    # 3-tuple of file handles being used for active writing.
    self._writinghandles = None

    # inline revlogs keep their data in the index file itself
    segment_name = index_file if inline else data_file
    cache_size = data_config.chunk_cache_size
    self._segmentfile = randomaccessfile.randomaccessfile(
        opener,
        segment_name,
        cache_size,
        chunk_cache,
    )
    self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
        opener,
        sidedata_file,
        cache_size,
    )

    # revlog header -> revlog compressor
    self._decompressors = {}
    # 3-tuple of (node, rev, text) for a raw revision.
    self._revisioncache = None

    # Cache of some uncompressed chunks (rev -> uncompressed_chunk); it
    # only exists when an uncompressed cache factor is configured.
    #
    # The max cost is dynamically updated to be proportional to the size
    # of the revisions we actually encounter.
    if data_config.uncompressed_cache_factor is None:
        self._uncompressed_chunk_cache = None
    else:
        self._uncompressed_chunk_cache = util.lrucachedict(
            data_config.uncompressed_cache_count,
            maxcost=65536,  # some arbitrary initial value
        )

    self._delay_buffer = None

434

435

def __len__(self):

435

def __len__(self):

436

return len(self.index)

436

return len(self.index)

437

438

def clear_cache(self):

438

def clear_cache(self):

439

assert not self.is_delaying

439

assert not self.is_delaying

440

self._revisioncache = None

440

self._revisioncache = None

441

if self._uncompressed_chunk_cache is not None:

441

if self._uncompressed_chunk_cache is not None:

442

self._uncompressed_chunk_cache.clear()

442

self._uncompressed_chunk_cache.clear()

443

self._segmentfile.clear_cache()

443

self._segmentfile.clear_cache()

444

self._segmentfile_sidedata.clear_cache()

444

self._segmentfile_sidedata.clear_cache()

445

446

@property

446

@property

447

def canonical_index_file(self):

447

def canonical_index_file(self):

448

if self._orig_index_file is not None:

448

if self._orig_index_file is not None:

449

return self._orig_index_file

449

return self._orig_index_file

450

return self.index_file

450

return self.index_file

451

452

@property

452

@property

453

def is_delaying(self):

453

def is_delaying(self):

454

"""is the revlog is currently delaying the visibility of written data?

454

"""is the revlog is currently delaying the visibility of written data?

455

456

The delaying mechanism can be either in-memory or written on disk in a

456

The delaying mechanism can be either in-memory or written on disk in a

457

side-file."""

457

side-file."""

458

return (self._delay_buffer is not None) or (

458

return (self._delay_buffer is not None) or (

459

self._orig_index_file is not None

459

self._orig_index_file is not None

460

)

460

)

461

462

# Derived from index values.

462

# Derived from index values.

463

464

def start(self, rev):

464

def start(self, rev):

465

"""the offset of the data chunk for this revision"""

465

"""the offset of the data chunk for this revision"""

466

return int(self.index[rev][0] >> 16)

466

return int(self.index[rev][0] >> 16)

467

468

def length(self, rev):

468

def length(self, rev):

469

"""the length of the data chunk for this revision"""

469

"""the length of the data chunk for this revision"""

470

return self.index[rev][1]

470

return self.index[rev][1]

471

472

def end(self, rev):

472

def end(self, rev):

473

"""the end of the data chunk for this revision"""

473

"""the end of the data chunk for this revision"""

474

return self.start(rev) + self.length(rev)

474

return self.start(rev) + self.length(rev)

475

476

def deltaparent(self, rev):

476

def deltaparent(self, rev):

477

"""return deltaparent of the given revision"""

477

"""return deltaparent of the given revision"""

478

base = self.index[rev][3]

478

base = self.index[rev][3]

479

if base == rev:

479

if base == rev:

480

return nullrev

480

return nullrev

481

elif self.delta_config.general_delta:

481

elif self.delta_config.general_delta:

482

return base

482

return base

483

else:

483

else:

484

return rev - 1

484

return rev - 1

485

486

def issnapshot(self, rev):

486

def issnapshot(self, rev):

487

"""tells whether rev is a snapshot"""

487

"""tells whether rev is a snapshot"""

488

if not self.delta_config.sparse_revlog:

488

if not self.delta_config.sparse_revlog:

489

return self.deltaparent(rev) == nullrev

489

return self.deltaparent(rev) == nullrev

490

elif hasattr(self.index, 'issnapshot'):

490

elif hasattr(self.index, 'issnapshot'):

491

# directly assign the method to cache the testing and access

491

# directly assign the method to cache the testing and access

492

self.issnapshot = self.index.issnapshot

492

self.issnapshot = self.index.issnapshot

493

return self.issnapshot(rev)

493

return self.issnapshot(rev)

494

if rev == nullrev:

494

if rev == nullrev:

495

return True

495

return True

496

entry = self.index[rev]

496

entry = self.index[rev]

497

base = entry[3]

497

base = entry[3]

498

if base == rev:

498

if base == rev:

499

return True

499

return True

500

if base == nullrev:

500

if base == nullrev:

501

return True

501

return True

502

p1 = entry[5]

502

p1 = entry[5]

503

while self.length(p1) == 0:

503

while self.length(p1) == 0:

504

b = self.deltaparent(p1)

504

b = self.deltaparent(p1)

505

if b == p1:

505

if b == p1:

506

break

506

break

507

p1 = b

507

p1 = b

508

p2 = entry[6]

508

p2 = entry[6]

509

while self.length(p2) == 0:

509

while self.length(p2) == 0:

510

b = self.deltaparent(p2)

510

b = self.deltaparent(p2)

511

if b == p2:

511

if b == p2:

512

break

512

break

513

p2 = b

513

p2 = b

514

if base == p1 or base == p2:

514

if base == p1 or base == p2:

515

return False

515

return False

516

return self.issnapshot(base)

516

return self.issnapshot(base)

517

518

def _deltachain(self, rev, stoprev=None):
    """Compute the delta chain leading to ``rev``.

    ``stoprev`` is an optional revision at which the walk is interrupted;
    without it the walk goes down to the base of the chain.

    The result is a ``(chain, stopped)`` pair: ``chain`` lists revisions
    in ascending order and ``stopped`` is a bool telling whether the walk
    ended because ``stoprev`` was reached.
    """
    use_general_delta = self.delta_config.general_delta
    # Prefer the index's own implementation when it provides one.
    try:
        return self.index.deltachain(
            rev, stoprev, use_general_delta
        )  # pytype: disable=attribute-error
    except AttributeError:
        pass

    # Local alias: avoids an attribute lookup per iteration.
    index = self.index
    visited = []
    current = rev
    entry = index[current]
    while not (current == entry[3] or current == stoprev):
        visited.append(current)
        # general delta follows the recorded base (entry[3]), otherwise
        # the chain is simply the previous revision
        current = entry[3] if use_general_delta else current - 1
        entry = index[current]

    hit_stop = bool(current == stoprev)
    if not hit_stop:
        # the chain base itself belongs to the chain
        visited.append(current)

    return visited[::-1], hit_stop

560

561

@util.propertycache
def _compressor(self):
    """Revlog compressor of the configured compression engine."""
    config = self.feature_config
    engine = util.compengines[config.compression_engine]
    return engine.revlogcompressor(config.compression_engine_options)

567

568

@util.propertycache
def _decompressor(self):
    """Decompression callable for the default compression header.

    Evaluates to None when no default compression header is set.
    """
    header = self._default_compression_header
    if header is None:
        return None
    return self._get_decompressor(header).decompress

576

577

def _get_decompressor(self, t: bytes):
    """Return the compressor object registered for header ``t``.

    Objects are memoized in ``self._decompressors``. A header with no
    matching engine raises ``error.RevlogError``.
    """
    try:
        return self._decompressors[t]
    except KeyError:
        # not memoized yet, build it below
        pass
    try:
        engine = util.compengines.forrevlogheader(t)
        options = self.feature_config.compression_engine_options
        found = engine.revlogcompressor(options)
        self._decompressors[t] = found
    except KeyError:
        raise error.RevlogError(
            _(b'unknown compression type %s') % binascii.hexlify(t)
        )
    return found

592

593

def compress(self, data: bytes) -> Tuple[bytes, bytes]:
    """Produce a ``(header, payload)`` pair for ``data``, compressed if possible."""
    if data:
        packed = self._compressor.compress(data)
        if packed:
            # The revlog compressor already embedded its header in the
            # payload it returned.
            return b'', packed
        if data[0:1] != b'\0':
            # stored uncompressed, flagged with the b'u' header
            return b'u', data
    # empty input, or uncompressed data starting with NUL: no header
    return b'', data

607

608

def decompress(self, data: bytes):
    """Decompress one revlog chunk.

    The first byte of the chunk is a header naming the storage format; it
    selects which decompressor handles the chunk.
    """
    if not data:
        return data

    # This is a hot path: revlogs are read far more often than written and
    # many chunks decompress in microseconds. The checks are ordered for
    # the expected mix of chunks: most are compressed, and decompressing
    # anything is likely at least 10x slower than handing back raw inline
    # data. The common, officially supported engine (zlib) is therefore
    # tested inline first; the generic engine lookup comes last.
    #
    # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
    # compressed chunks, which matters for changelog and manifest reads.
    header = data[0:1]

    if header == b'x':
        try:
            return _zlibdecompress(data)
        except zlib.error as e:
            raise error.RevlogError(
                _(b'revlog decompress error: %s')
                % stringutil.forcebytestr(e)
            )
    # '\0' is more common than 'u' so it is tested first.
    if header == b'\0':
        return data
    if header == b'u':
        # skip the one-byte marker
        return util.buffer(data, 1)

    return self._get_decompressor(header).decompress(data)

657

658

@contextlib.contextmanager
def reading(self):
    """Context manager keeping the data and sidedata files open for reading"""
    if len(self.index) == 0:
        # empty revlog: there is nothing to read
        yield
        return
    if self._delay_buffer is not None and self.inline:
        raise error.ProgrammingError(
            "revlog with delayed write should not be inline"
        )
    with self._segmentfile.reading(), self._segmentfile_sidedata.reading():
        yield

670

671

@property
def is_writing(self):
    """True if a writing context is open"""
    handles = self._writinghandles
    return handles is not None

675

676

@property
def is_open(self):
    """True if any file handle is being held

    Used for assert and debug in the python code"""
    data_open = self._segmentfile.is_open
    return data_open if data_open else self._segmentfile_sidedata.is_open

682

683

@contextlib.contextmanager
def writing(self, transaction, data_end=None, sidedata_end=None):
    """Open the revlog files for writing

    Adding content to a revlog should be done within such a context.

    ``transaction`` gets every opened file registered through its
    ``add()`` method. ``data_end`` is the offset the data file handle is
    positioned at (end of file when None). ``sidedata_end`` is the offset
    the sidedata file handle is positioned at; it must not be None when
    the revlog has a sidedata file.

    When a writing context is already open, this is a no-op that simply
    yields. Otherwise all handles are closed when the context exits.
    """
    if self.is_writing:
        yield
    else:
        ifh = dfh = sdfh = None
        try:
            r = len(self.index)
            # opening the data file.
            dsize = 0
            if r:
                dsize = self.end(r - 1)
            if not self.inline:
                try:
                    dfh = self.opener(self.data_file, mode=b"r+")
                    if data_end is None:
                        dfh.seek(0, os.SEEK_END)
                    else:
                        dfh.seek(data_end, os.SEEK_SET)
                except FileNotFoundError:
                    dfh = self.opener(self.data_file, mode=b"w+")
                transaction.add(self.data_file, dsize)
            if self.sidedata_file is not None:
                assert sidedata_end is not None
                # revlog-v2 does not inline, help Pytype
                assert dfh is not None
                try:
                    sdfh = self.opener(self.sidedata_file, mode=b"r+")
                    # Position the sidedata handle itself; the data handle
                    # must stay where it was placed above.
                    sdfh.seek(sidedata_end, os.SEEK_SET)
                except FileNotFoundError:
                    sdfh = self.opener(self.sidedata_file, mode=b"w+")
                transaction.add(self.sidedata_file, sidedata_end)

            # opening the index file.
            isize = r * self.index.entry_size
            ifh = self.__index_write_fp()
            if self.inline:
                # inline revlogs keep index entries and data in one file
                transaction.add(self.index_file, dsize + isize)
            else:
                transaction.add(self.index_file, isize)
            # exposing all file handle for writing.
            self._writinghandles = (ifh, dfh, sdfh)
            self._segmentfile.writing_handle = ifh if self.inline else dfh
            self._segmentfile_sidedata.writing_handle = sdfh
            yield
        finally:
            self._writinghandles = None
            self._segmentfile.writing_handle = None
            self._segmentfile_sidedata.writing_handle = None
            if dfh is not None:
                dfh.close()
            if sdfh is not None:
                sdfh.close()
            # closing the index file last to avoid exposing referent to
            # potential unflushed data content.
            if ifh is not None:
                ifh.close()

745

746

def __index_write_fp(self, index_end=None):
    """Internal helper opening the index file for writing.

    Not meant to be used directly; callers are expected to go through a
    writing context instead.

    The handle is positioned at ``index_end``, or at the end of the file
    when ``index_end`` is None. A missing index file is created, in which
    case no seek is performed.
    """
    delayed = self._delay_buffer is not None
    try:
        if delayed:
            # check_ambig only matters when a real file is opened for
            # writing. Here writes are appended to the delay buffer, so
            # the option is meaningless and not passed.
            handle = randomaccessfile.appender(
                self.opener, self.index_file, b"r+", self._delay_buffer
            )
        else:
            handle = self.opener(
                self.index_file,
                mode=b"r+",
                checkambig=self.data_config.check_ambig,
            )
        if index_end is not None:
            handle.seek(index_end, os.SEEK_SET)
        else:
            handle.seek(0, os.SEEK_END)
        return handle
    except FileNotFoundError:
        if delayed:
            return randomaccessfile.appender(
                self.opener, self.index_file, b"w+", self._delay_buffer
            )
        return self.opener(
            self.index_file,
            mode=b"w+",
            checkambig=self.data_config.check_ambig,
        )

782

783

def __index_new_fp(self):
    """Internal helper creating a brand new index file for writing.

    Only meant for the upgrade away from an inline revlog.
    """
    ambig_check = self.data_config.check_ambig
    return self.opener(self.index_file, mode=b"w", checkambig=ambig_check)

793

794

def split_inline(self, tr, header, new_index_file_path=None):
    """Split an inline revlog into a separate index file and data file.

    Returns the index file path in use once the split is done.
    """
    assert self._delay_buffer is None
    had_handles = self._writinghandles is not None
    if had_handles:
        inline_fh = self._writinghandles[0]
        inline_fh.flush()
        inline_fh.close()
        # A closed handle must not be reused, so drop every cached
        # reference to it.
        self._writinghandles = None
        self._segmentfile.writing_handle = None
        # The sidedata writing handle needs no care: it only exists with
        # revlog-v2, which is never inline and so never reaches this code.

    data_fh = self.opener(self.data_file, mode=b"w+")
    data_fh.truncate(0)  # drop any potentially existing data
    try:
        # copy every revision's raw segment into the new data file
        with self.reading():
            for rev in range(len(self.index)):
                segment = self.get_segment_for_revs(rev, rev)[1]
                data_fh.write(segment)
            data_fh.flush()

        if new_index_file_path is not None:
            self.index_file = new_index_file_path
        with self.__index_new_fp() as index_fh:
            self.inline = False
            for rev in range(len(self.index)):
                record = self.index.entry_binary(rev)
                if rev == 0:
                    # the first record carries the packed header
                    record = self.index.pack_header(header) + record
                index_fh.write(record)

            # If we don't use side-write, the temp file replaces the real
            # index when we exit the context manager

        self._segmentfile = randomaccessfile.randomaccessfile(
            self.opener,
            self.data_file,
            self.data_config.chunk_cache_size,
        )

        if had_handles:
            # switched from inline to conventional: reopen the index
            reopened_index = self.__index_write_fp()
            self._writinghandles = (reopened_index, data_fh, None)
            self._segmentfile.writing_handle = data_fh
            # ownership moved to the writing handles, do not close below
            data_fh = None
            # Same remark as above for the sidedata writing handle.
    finally:
        if data_fh is not None:
            data_fh.close()
    return self.index_file

852

853

def get_segment_for_revs(self, startrev, endrev):
    """Fetch the raw data segment spanning a range of revisions.

    Takes the first and last revision of the range. The read goes through
    ``self._segmentfile.read_chunk``, so it may be served from a cache.

    Returns an ``(offset, data)`` pair: ``offset`` is the integer offset
    of the segment from the beginning of the revlog and ``data`` is a str
    or buffer holding the raw bytes.

    Callers still need ``self.start(rev)`` and ``self.length(rev)`` to
    locate each revision inside the segment.

    API: we should consider making this a private part of the InnerRevlog
    at some point.
    """
    # self.start(startrev) and self.end(endrev) are expanded by hand here
    # for performance (function calls are expensive).
    index = self.index
    first_entry = index[startrev]
    start = int(first_entry[0] >> 16)
    if startrev == endrev:
        end = start + first_entry[1]
    else:
        last_entry = index[endrev]
        end = int(last_entry[0] >> 16) + last_entry[1]

    if self.inline:
        # inline revlogs interleave index entries with the data
        entry_size = self.index.entry_size
        start += (startrev + 1) * entry_size
        end += (endrev + 1) * entry_size

    return start, self._segmentfile.read_chunk(start, end - start)

889

890

def _chunk(self, rev):
    """Return the decompressed chunk of a single revision.

    Takes an integer revision and returns its uncompressed data. The
    result is looked up in, and stored into, the uncompressed chunk cache
    when that cache is enabled.
    """
    cache = self._uncompressed_chunk_cache
    if cache is not None:
        hit = cache.get(rev)
        if hit is not None:
            return hit

    mode = self.index[rev][10]
    raw = self.get_segment_for_revs(rev, rev)[1]
    if mode == COMP_MODE_PLAIN:
        text = raw
    elif mode == COMP_MODE_DEFAULT:
        text = self._decompressor(raw)
    elif mode == COMP_MODE_INLINE:
        text = self.decompress(raw)
    else:
        msg = b'unknown compression mode %d'
        msg %= mode
        raise error.RevlogError(msg)

    if cache is not None:
        cache.insert(rev, text, cost=len(text))
    return text

919

920

def _chunks(self, revs, targetsize=None):
    """Obtain decompressed chunks for the specified revisions.

    Accepts an iterable of numeric revisions that are assumed to be in
    ascending order. ``targetsize`` is forwarded to
    ``deltautil.slicechunk`` when sparse reads are enabled.

    This function is similar to calling ``self._chunk()`` multiple times,
    but is faster.

    Returns a list with decompressed data for each requested revision.
    """
    if not revs:
        return []
    # Local aliases: avoid repeated attribute lookups in the loops below.
    start = self.start
    length = self.length
    inline = self.inline
    iosize = self.index.entry_size
    buffer = util.buffer

    fetched_revs = []
    fadd = fetched_revs.append

    # (rev, data) pairs, sorted by revision before returning
    chunks = []
    ladd = chunks.append

    if self._uncompressed_chunk_cache is None:
        fetched_revs = revs
    else:
        # only revisions missing from the cache need to be read
        for rev in revs:
            cached_value = self._uncompressed_chunk_cache.get(rev)
            if cached_value is None:
                fadd(rev)
            else:
                ladd((rev, cached_value))

    if not fetched_revs:
        slicedchunks = ()
    elif not self.data_config.with_sparse_read:
        slicedchunks = (fetched_revs,)
    else:
        slicedchunks = deltautil.slicechunk(
            self,
            fetched_revs,
            targetsize=targetsize,
        )

    for revschunk in slicedchunks:
        firstrev = revschunk[0]
        # Skip trailing revisions with empty diff
        for lastrev in revschunk[::-1]:
            if length(lastrev) != 0:
                break

        try:
            offset, data = self.get_segment_for_revs(firstrev, lastrev)
        except OverflowError:
            # issue4215 - we can't cache a run of chunks greater than
            # 2G on Windows
            for rev in revschunk:
                ladd((rev, self._chunk(rev)))
            # This slice is fully handled. Without this, the code below
            # would run with ``offset``/``data`` unbound (or left over
            # from the previous slice) and add every revision twice.
            continue

        decomp = self.decompress
        # self._decompressor might be None, but will not be used in that case
        def_decomp = self._decompressor
        for rev in revschunk:
            chunkstart = start(rev)
            if inline:
                # inline revlogs interleave index entries with the data
                chunkstart += (rev + 1) * iosize
            chunklength = length(rev)
            comp_mode = self.index[rev][10]
            c = buffer(data, chunkstart - offset, chunklength)
            if comp_mode == COMP_MODE_PLAIN:
                pass  # stored as-is, nothing to decompress
            elif comp_mode == COMP_MODE_INLINE:
                c = decomp(c)
            elif comp_mode == COMP_MODE_DEFAULT:
                c = def_decomp(c)
            else:
                msg = b'unknown compression mode %d'
                msg %= comp_mode
                raise error.RevlogError(msg)
            ladd((rev, c))
            if self._uncompressed_chunk_cache is not None:
                self._uncompressed_chunk_cache.insert(rev, c, len(c))

    chunks.sort()
    return [x[1] for x in chunks]

1007

1008

def raw_text(self, node, rev) -> bytes:
    """rebuild the (possibly unvalidated) rawtext of revision ``rev``

    The delta chain of ``rev`` is computed, stopping at the revision held
    in ``self._revisioncache`` when that revision is part of the chain, and
    the chunks of the chain are patched on top of the base text.

    ``node`` is accepted but not used by this method.

    returns rawtext
    """
    # The cache entry looks like (node, rev, rawtext); when one is present
    # its revision is offered as a stopping point for the chain walk.
    stop_at = self._revisioncache[1] if self._revisioncache else None

    chain, stopped = self._deltachain(rev, stoprev=stop_at)
    # If the walk stopped on the cached revision, the cached text is the
    # intermediate text the remaining deltas apply to.
    basetext = self._revisioncache[2] if stopped else None

    # drop cache to save memory, the caller is expected to
    # update self._inner._revisioncache after validating the text
    self._revisioncache = None

    rawsize = self.index[rev][2]
    # a negative size gives no usable read target
    targetsize = 4 * rawsize if rawsize >= 0 else None

    chunk_cache = self._uncompressed_chunk_cache
    if chunk_cache is not None:
        # grow the uncompressed chunk cache budget so it follows the
        # largest revision seen so far in this revlog
        wanted_cost = rawsize * self.data_config.uncompressed_cache_factor
        if chunk_cache.maxcost < wanted_cost:
            chunk_cache.maxcost = wanted_cost

    bins = self._chunks(chain, targetsize=targetsize)
    if basetext is None:
        # no cached base: the first chunk of the chain is the base text
        basetext = bytes(bins[0])
        bins = bins[1:]

    rawtext = mdiff.patches(basetext, bins)
    del basetext  # let us have a chance to free memory early
    return rawtext

1053

1054

def sidedata(self, rev, sidedata_end):
    """Return the sidedata for a given revision number.

    The offset and size of the sidedata segment are read from the index
    entry of ``rev``. An empty dict is returned when the recorded size is
    zero. A ``RevlogError`` is raised when the segment would extend past
    ``sidedata_end`` or when the entry carries an unknown compression mode.
    """
    entry = self.index[rev]
    seg_offset = entry[8]
    seg_size = entry[9]

    if self.inline:
        seg_offset += self.index.entry_size * (1 + rev)
    if seg_size == 0:
        return {}

    if sidedata_end < seg_offset + seg_size:
        details = (self.sidedata_file, seg_size, seg_offset, sidedata_end)
        raise error.RevlogError(FILE_TOO_SHORT_MSG % details)

    comp_segment = self._segmentfile_sidedata.read_chunk(seg_offset, seg_size)

    comp = entry[11]
    if comp == COMP_MODE_PLAIN:
        # stored as is
        segment = comp_segment
    elif comp == COMP_MODE_INLINE:
        segment = self.decompress(comp_segment)
    elif comp == COMP_MODE_DEFAULT:
        segment = self._decompressor(comp_segment)
    else:
        msg = b'unknown compression mode %d'
        msg %= comp
        raise error.RevlogError(msg)

    return sidedatautil.deserialize_sidedata(segment)

1091

1092

def write_entry(
    self,
    transaction,
    entry,
    data,
    link,
    offset,
    sidedata,
    sidedata_offset,
    index_end,
    data_end,
    sidedata_end,
):
    """write one revision through the currently open writing handles

    ``entry`` is the packed index entry and ``data`` a two-item sequence
    whose items are written one after the other. For a non-inline revlog
    the data goes to the data handle, ``sidedata`` (when not empty) to the
    sidedata handle, and the entry to the index handle or to the delay
    buffer when one is in place. For an inline revlog the entry and the
    data are all written to the index handle.

    ``link`` is accepted but not used by this method.

    Returns a ``(index, data, sidedata)`` tuple of handle positions after
    the write; a position is None when the matching handle is not open.

    Raises ``ProgrammingError`` when no writing handles are open or when a
    delay buffer is in place on an inline revlog.
    """
    handles = self._writinghandles
    if handles is None:
        msg = b'adding revision outside `revlog._writing` context'
        raise error.ProgrammingError(msg)
    ifh, dfh, sdfh = handles

    # Files opened in a+ mode behave inconsistently across platforms.
    # Windows needs a positioning call whenever a handle switches between
    # reading and writing (see 3686fa2b8eee and the mixedfilemodewrapper
    # in windows.py), and some versions of Solaris were seen not to append
    # at the end of a file that had been seeked before its end (see
    # issue4943). An explicit seek() before writing works around both.
    #
    # Note: This is likely not necessary on Python 3. However, because the
    # handle is reused for reads and may be seeked there, we need to be
    # careful before changing this.
    def seek_to(fh, end):
        if end is None:
            fh.seek(0, os.SEEK_END)
        else:
            fh.seek(end, os.SEEK_SET)

    seek_to(ifh, index_end)
    if dfh:
        seek_to(dfh, data_end)
    if sdfh:
        sdfh.seek(sidedata_end, os.SEEK_SET)

    curr = len(self.index) - 1
    if not self.inline:
        transaction.add(self.data_file, offset)
        if self.sidedata_file:
            transaction.add(self.sidedata_file, sidedata_offset)
        transaction.add(self.canonical_index_file, curr * len(entry))
        if data[0]:
            dfh.write(data[0])
        dfh.write(data[1])
        if sidedata:
            sdfh.write(sidedata)
        if self._delay_buffer is not None:
            # index writes are being delayed: keep the entry in memory
            self._delay_buffer.append(entry)
        else:
            ifh.write(entry)
    elif self._delay_buffer is not None:
        msg = b'invalid delayed write on inline revlog'
        raise error.ProgrammingError(msg)
    else:
        # inline: the data lives in the index file, after the entries
        offset += curr * self.index.entry_size
        transaction.add(self.canonical_index_file, offset)
        assert not sidedata
        ifh.write(entry)
        ifh.write(data[0])
        ifh.write(data[1])

    index_pos = ifh.tell()
    data_pos = dfh.tell() if dfh else None
    sidedata_pos = sdfh.tell() if sdfh else None
    return (index_pos, data_pos, sidedata_pos)

1163

1164

def _divert_index(self):

1164

def _divert_index(self):

1165

index_file = self.index_file

1165

index_file = self.index_file

1166

# when we encounter a legacy inline-changelog, split it. However it is

1166

# when we encounter a legacy inline-changelog, split it. However it is

1167

# important to use the expected filename for pending content

1167

# important to use the expected filename for pending content

1168

# (<radix>.a) otherwise hooks won't be seeing the content of the

1168

# (<radix>.a) otherwise hooks won't be seeing the content of the

1169

# pending transaction.

1169

# pending transaction.

1170

if index_file.endswith(b'.s'):

1170

if index_file.endswith(b'.s'):

1171

index_file = self.index_file[:-2]

1171

index_file = self.index_file[:-2]

1172

return index_file + b'.a'

1172

return index_file + b'.a'

1173

1174

def delay(self):
    """start delaying or diverting index writes

    Nothing happens when a delay buffer or a diverted index is already in
    place. Otherwise an empty index is diverted to the pending index file
    (any existing file of that name is removed) and a non-empty index gets
    an in-memory delay buffer.

    Returns the diverted index file name when a divert was set up by this
    call, None otherwise. Raises ``ProgrammingError`` on an inline revlog.
    """
    assert not self.is_open
    if self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)

    if self._delay_buffer is not None or self._orig_index_file is not None:
        # delay or divert already in place
        return None

    if len(self.index) != 0:
        # existing content: buffer the new index entries in memory
        self._delay_buffer = []
        return None

    # empty index: write straight to the pending file instead
    self._orig_index_file = self.index_file
    self.index_file = self._divert_index()
    assert self._orig_index_file is not None
    assert self.index_file is not None
    if self.opener.exists(self.index_file):
        self.opener.unlink(self.index_file)
    return self.index_file

1193

1194

def write_pending(self):
    """expose the pending index content in the diverted index file

    When the index is already diverted, ``(None, True)`` is returned right
    away. Otherwise the current index file is copied to the pending index
    file (replacing any existing one), the content of the delay buffer is
    appended to that copy, the delay buffer is dropped and the revlog is
    switched to the pending file.

    Returns ``(index_file, any_pending)`` where ``any_pending`` tells
    whether buffered entries were written. Raises ``ProgrammingError`` on
    an inline revlog.
    """
    assert not self.is_open
    if self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)
    if self._orig_index_file is not None:
        return None, True

    pending_name = self._divert_index()
    if self.opener.exists(pending_name):
        self.opener.unlink(pending_name)
    util.copyfile(
        self.opener.join(self.index_file),
        self.opener.join(pending_name),
    )

    buffered = self._delay_buffer
    if buffered:
        with self.opener(pending_name, b'r+') as ifh:
            ifh.seek(0, os.SEEK_END)
            ifh.write(b"".join(buffered))
    any_pending = bool(buffered)

    self._delay_buffer = None
    self._orig_index_file = self.index_file
    self.index_file = pending_name
    return pending_name, any_pending

1218

1219

def finalize_pending(self):
    """make delayed or diverted index content final

    With a delay buffer in place, its content (if any) is appended to the
    index file and the buffer is dropped. With a diverted index, the
    diverted file (if it exists) is renamed over the original index file
    and the revlog is switched back to the original name.

    Returns ``self.canonical_index_file``. Raises ``ProgrammingError`` on
    an inline revlog or when neither a delay nor a divert is in place.
    """
    assert not self.is_open
    if self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)

    has_buffer = self._delay_buffer is not None
    is_diverted = self._orig_index_file is not None

    if has_buffer and is_diverted:
        assert False, "unreachable"
    elif has_buffer:
        pending = self._delay_buffer
        if pending:
            with self.opener(self.index_file, b'r+') as ifh:
                ifh.seek(0, os.SEEK_END)
                ifh.write(b"".join(pending))
        self._delay_buffer = None
    elif is_diverted:
        diverted_name = self.index_file
        original_name = self._orig_index_file
        if self.opener.exists(diverted_name):
            self.opener.rename(diverted_name, original_name, checkambig=True)
        self.index_file = original_name
        self._orig_index_file = None
    else:
        msg = b"not delay or divert found on this revlog"
        raise error.ProgrammingError(msg)
    return self.canonical_index_file

1249

1250

1251

# Pick the base class used by RustIndexProxy below: static type checkers see
# BaseIndexObject, while at runtime the base is a plain `object`.
if typing.TYPE_CHECKING:
    # Tell Pytype what kind of object we expect
    ProxyBase = BaseIndexObject
else:
    ProxyBase = object

1256

1257

1258

class RustIndexProxy(ProxyBase):
    """Wrapper around the Rust index to fake having direct access to the index.

    Rust enforces xor mutability (one mutable reference XOR 1..n non-mutable),
    so we can't expose the index from Rust directly, since the `InnerRevlog`
    already has ownership of the index. This object redirects all calls to the
    index through the Rust-backed `InnerRevlog` glue which defines all
    necessary forwarding methods.

    Attribute ``name`` is looked up as ``_index_<name>`` on the wrapped object.
    """

    def __init__(self, inner):
        # Do not rename as it's being used to access the index from Rust
        self.inner = inner

    # TODO possibly write all index methods manually to save on overhead?
    def __getattr__(self, name):
        if name == "inner":
            # `__getattr__` only runs when normal lookup failed, so getting
            # here means `inner` is not set on this instance. Reading
            # `self.inner` below would call `__getattr__` again and recurse
            # without bound; report the missing attribute instead.
            raise AttributeError(name)
        return getattr(self.inner, f"_index_{name}")

    # Magic methods need to be defined explicitly: they are looked up on the
    # type, so `__getattr__` is not used for them.
    def __len__(self):
        return self.inner._index___len__()

    def __getitem__(self, key):
        return self.inner._index___getitem__(key)

    def __contains__(self, key):
        return self.inner._index___contains__(key)

    def __delitem__(self, key):
        return self.inner._index___delitem__(key)

1288

1289

1290

class RustVFSWrapper:
    """Used to wrap a Python VFS to pass it to Rust to lower the overhead of
    calling back multiple times into Python.

    Calling the wrapper opens the file through the wrapped VFS and returns
    the information Rust needs instead of a Python file object. Any other
    attribute is forwarded to the wrapped VFS.
    """

    def __init__(self, inner):
        self.inner = inner

    def __call__(
        self,
        path: bytes,
        mode: bytes = b"rb",
        atomictemp=False,
        checkambig=False,
    ):
        """Open ``path`` through the wrapped VFS.

        Returns ``(fd, tempname)``: ``fd`` is a duplicate of the opened
        file's descriptor and ``tempname`` is the opened file's
        ``_tempname`` when ``atomictemp`` is set, None otherwise.
        """
        fd = self.inner.__call__(
            path=path, mode=mode, atomictemp=atomictemp, checkambig=checkambig
        )
        # Information that Rust needs to get ownership of the file that's
        # being opened.
        return (os.dup(fd.fileno()), fd._tempname if atomictemp else None)

    def __getattr__(self, name):
        if name == "inner":
            # `__getattr__` only runs when normal lookup failed, so getting
            # here means `inner` is not set on this instance. Reading
            # `self.inner` below would call `__getattr__` again and recurse
            # without bound; report the missing attribute instead.
            raise AttributeError(name)
        return getattr(self.inner, name)

1314

1315

1316

class revlog:

1316

class revlog:

1317

"""

1317

"""

1318

the underlying revision storage object

1318

the underlying revision storage object

1319

1320

A revlog consists of two parts, an index and the revision data.

1320

A revlog consists of two parts, an index and the revision data.

1321

1322

The index is a file with a fixed record size containing

1322

The index is a file with a fixed record size containing

1323

information on each revision, including its nodeid (hash), the

1323

information on each revision, including its nodeid (hash), the

1324

nodeids of its parents, the position and offset of its data within

1324

nodeids of its parents, the position and offset of its data within

1325

the data file, and the revision it's based on. Finally, each entry

1325

the data file, and the revision it's based on. Finally, each entry

1326

contains a linkrev entry that can serve as a pointer to external

1326

contains a linkrev entry that can serve as a pointer to external

1327

data.

1327

data.

1328

1329

The revision data itself is a linear collection of data chunks.

1329

The revision data itself is a linear collection of data chunks.

1330

Each chunk represents a revision and is usually represented as a

1330

Each chunk represents a revision and is usually represented as a

1331

delta against the previous chunk. To bound lookup time, runs of

1331

delta against the previous chunk. To bound lookup time, runs of

1332

deltas are limited to about 2 times the length of the original

1332

deltas are limited to about 2 times the length of the original

1333

version data. This makes retrieval of a version proportional to

1333

version data. This makes retrieval of a version proportional to

1334

its size, or O(1) relative to the number of revisions.

1334

its size, or O(1) relative to the number of revisions.

1335

1336

Both pieces of the revlog are written to in an append-only

1336

Both pieces of the revlog are written to in an append-only

1337

fashion, which means we never need to rewrite a file to insert or

1337

fashion, which means we never need to rewrite a file to insert or

1338

remove data, and can use some simple techniques to avoid the need

1338

remove data, and can use some simple techniques to avoid the need

1339

for locking while reading.

1339

for locking while reading.

1340

1341

If checkambig, indexfile is opened with checkambig=True at

1341

If checkambig, indexfile is opened with checkambig=True at

1342

writing, to avoid file stat ambiguity.

1342

writing, to avoid file stat ambiguity.

1343

1344

If mmaplargeindex is True, and an mmapindexthreshold is set, the

1344

If mmaplargeindex is True, and an mmapindexthreshold is set, the

1345

index will be mmapped rather than read if it is larger than the

1345

index will be mmapped rather than read if it is larger than the

1346

configured threshold.

1346

configured threshold.

1347

1348

If censorable is True, the revlog can have censored revisions.

1348

If censorable is True, the revlog can have censored revisions.

1349

1350

If `upperboundcomp` is not None, this is the expected maximal gain from

1350

If `upperboundcomp` is not None, this is the expected maximal gain from

1351

compression for the data content.

1351

compression for the data content.

1352

1353

`concurrencychecker` is an optional function that receives 3 arguments: a

1353

`concurrencychecker` is an optional function that receives 3 arguments: a

1354

file handle, a filename, and an expected position. It should check whether

1354

file handle, a filename, and an expected position. It should check whether

1355

the current position in the file handle is valid, and log/warn/fail (by

1355

the current position in the file handle is valid, and log/warn/fail (by

1356

raising).

1356

raising).

1357

1358

See mercurial/revlogutils/constants.py for details about the content of an

1358

See mercurial/revlogutils/constants.py for details about the content of an

1359

index entry.

1359

index entry.

1360

"""

1360

"""

1361

1362

_flagserrorclass = error.RevlogError

1362

_flagserrorclass = error.RevlogError

1363

_inner: "_InnerRevlog"

1363

_inner: "_InnerRevlog"

1364

1365

opener: vfsmod.vfs

1365

opener: vfsmod.vfs

1366

1367

@staticmethod
def is_inline_index(header_bytes):
    """Determine if a revlog is inline from the initial bytes of the index

    Empty ``header_bytes`` are reported as inline. Otherwise the header is
    unpacked with ``INDEX_HEADER``, its low 16 bits select the format
    version and the remaining bits are handed to that version's
    ``b'inline'`` feature check.
    """
    if not len(header_bytes):
        return True

    header = INDEX_HEADER.unpack(header_bytes)[0]
    version = header & 0xFFFF
    flags = header & ~0xFFFF

    inline_check = FEATURES_BY_VERSION[version][b'inline']
    return inline_check(flags)

1380

1381

_docket_file: Optional[bytes]

1381

_docket_file: Optional[bytes]

1382

1383

def __init__(
    self,
    opener: vfsmod.vfs,
    target,
    radix,
    postfix=None,  # only exist for `tmpcensored` now
    checkambig=False,
    mmaplargeindex=False,
    censorable=False,
    upperboundcomp=None,
    persistentnodemap=False,
    concurrencychecker=None,
    trypending=False,
    try_split=False,
    canonical_parent_order=True,
    data_config=None,
    delta_config=None,
    feature_config=None,
    may_inline=True,  # may inline new revlog
):
    """
    create a revlog object

    opener is a function that abstracts the file opening operation
    and can be used to implement COW semantics or the like.

    `target`: a (KIND, ID) tuple that identifies the content stored in
    this revlog. It helps the rest of the code to understand what the
    revlog is about without having to resort to heuristics and index
    filename analysis. Note that this must reliably be set by normal code,
    but that test, debug, or performance measurement code might not set
    this to an accurate value.

    `feature_config`, `data_config` and `delta_config`: when given, a copy
    is used; otherwise a copy of the matching entry of `opener.options` is
    used when present, and a fresh default object as a last resort. The
    `censorable`, `canonical_parent_order`, `checkambig`, `mmaplargeindex`
    and `upperboundcomp` arguments are then stored on these objects.
    """

    def pick_config(explicit, option_key, factory):
        # explicit argument first, then the opener options, then a default
        if explicit is not None:
            return explicit.copy()
        options = self.opener.options
        if option_key in options:
            return options[option_key].copy()
        return factory()

    self.radix = radix

    self._docket_file = None
    self._indexfile = None
    self._datafile = None
    self._sidedatafile = None
    self._nodemap_file = None
    self.postfix = postfix
    self._trypending = trypending
    self._try_split = try_split
    self._may_inline = may_inline
    self.uses_rust = False
    self.opener = opener
    if persistentnodemap:
        self._nodemap_file = nodemaputil.get_nodemap_file(self)

    assert target[0] in ALL_KINDS
    assert len(target) == 2
    self.target = target

    self.feature_config = pick_config(
        feature_config, b'feature-config', FeatureConfig
    )
    self.feature_config.censorable = censorable
    self.feature_config.canonical_parent_order = canonical_parent_order

    self.data_config = pick_config(data_config, b'data-config', DataConfig)
    self.data_config.check_ambig = checkambig
    self.data_config.mmap_large_index = mmaplargeindex

    self.delta_config = pick_config(
        delta_config, b'delta-config', DeltaConfig
    )
    self.delta_config.upper_bound_comp = upperboundcomp

    # Maps rev to chain base rev.
    self._chainbasecache = util.lrucachedict(100)

    self.index: Optional[BaseIndexObject] = None
    self._docket = None
    self._nodemap_docket = None
    # Mapping of partial identifiers to full nodes.
    self._pcache = {}

    # other optional features

    # Each revlog instance gets its own copy of the flag processors so
    # that custom flags can be supported per instance.
    self._flagprocessors = dict(flagutil.flagprocessors)
    # prevent nesting of addgroup
    self._adding_group = None

    index, chunk_cache = self._loadindex()
    self._load_inner(index, chunk_cache)
    self._concurrencychecker = concurrencychecker

1480

1481

def _init_opts(self):
    """Derive the default revlog settings from the opener options.

    The values computed here are defaults only; they might still be
    affected by the information actually read from disk.

    As a side effect this records ``compute_rank`` on the feature config
    (changelog-v2 only) and registers the ellipsis and option-provided
    flag processors in ``self._flagprocessors``.

    Returns a ``(new_header, mmapindexthreshold, force_nodemap)`` tuple
    for use in ``_loadindex()``:

    * new_header:
        version header to use if we need to create a new revlog

    * mmapindexthreshold:
        minimal index size from which mmap is used, or ``None`` when
        ``data_config.mmap_large_index`` is not set

    * force_nodemap:
        force the usage of a "development" version of the nodemap code

    Raises ``error.RevlogError`` when the configured chunk cache size is
    not strictly positive or is not a power of two.
    """
    opts = self.opener.options

    # Pick the header used when a brand new revlog must be created.
    if b'changelogv2' in opts and self.revlog_kind == KIND_CHANGELOG:
        new_header = CHANGELOGV2
        self.feature_config.compute_rank = opts.get(
            b'changelogv2.compute-rank', True
        )
    elif b'revlogv2' in opts:
        new_header = REVLOGV2
    elif b'revlogv1' in opts:
        new_header = REVLOGV1
        if self._may_inline:
            new_header |= FLAG_INLINE_DATA
        if b'generaldelta' in opts:
            new_header |= FLAG_GENERALDELTA
    elif b'revlogv0' in self.opener.options:
        new_header = REVLOGV0
    else:
        new_header = REVLOG_DEFAULT_VERSION

    mmapindexthreshold = (
        self.data_config.mmap_index_threshold
        if self.data_config.mmap_large_index
        else None
    )

    if self.feature_config.enable_ellipsis:
        self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

    # revlog v0 doesn't have flag processors
    extra_processors = opts.get(b'flagprocessors', {})
    for flag, processor in extra_processors.items():
        flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

    cache_size = self.data_config.chunk_cache_size
    if cache_size <= 0:
        raise error.RevlogError(
            _(b'revlog chunk cache size %r is not greater than 0')
            % cache_size
        )
    # A power of two has a single bit set, so ``x & (x - 1)`` is zero.
    if cache_size & (cache_size - 1):
        raise error.RevlogError(
            _(b'revlog chunk cache size %r is not a power of 2')
            % cache_size
        )

    force_nodemap = opts.get(b'devel-force-nodemap', False)
    return new_header, mmapindexthreshold, force_nodemap

1539

1540

def _get_data(self, filepath, mmap_threshold, size=None):
    """Return the content of ``filepath``, with or without mmap.

    ``mmap_threshold`` is the minimal file size from which mmap is used
    (``None`` disables mmap entirely); mmap is additionally only used
    when the opener reports the path as mmap-safe. ``size`` optionally
    caps the amount of data returned.

    If the file is missing, the empty bytes string is returned.
    """
    try:
        with self.opener(filepath) as fp:
            use_mmap = False
            if mmap_threshold is not None:
                file_size = self.opener.fstat(fp).st_size
                use_mmap = (
                    file_size >= mmap_threshold
                    and self.opener.is_mmap_safe(filepath)
                )

            if use_mmap:
                # TODO: should .close() to release resources without
                # relying on Python GC
                if size is None:
                    return util.buffer(util.mmapread(fp))
                # never map past the end of the file, to avoid a
                # potential mmap crash
                return util.buffer(util.mmapread(fp, min(file_size, size)))

            if size is None:
                return fp.read()
            return fp.read(size)
    except FileNotFoundError:
        return b''

1567

1568

def get_streams(self, max_linkrev, force_inline=False):
    """Return a list of streams that represent this revlog.

    This is used by stream-clone to do bytes to bytes copies of a
    repository.

    Trailing revisions whose linkrev is not below `max_linkrev` are left
    out of the streamed data.

    If `force_inline` is set, it enforces that the stream will represent
    an inline revlog.

    The return value is a list of three-tuples:

        [
            (filename, bytes_stream, stream_size),
            …
        ]

    An empty list is returned when there is nothing to send.
    """
    index = self.index
    count = len(self)
    # note: this loop will rarely go through multiple iterations, since
    # it only traverses commits created during the current streaming
    # pull operation.
    #
    # If this becomes a problem, using a binary search should cap the
    # runtime of this.
    while count > 0 and not (index[count - 1][4] < max_linkrev):
        count -= 1

    if count == 0:
        # no data to send
        return []

    index_size = count * index.entry_size
    data_size = self.end(count - 1)

    # XXX we might have been split (or stripped) since the object
    # initialization. We need to close this race too, but having a way to
    # pre-open the file we feed to the revlog and never closing them before
    # we are done streaming.

    def file_stream(open_file, limit):
        # The leading ``None`` lets the caller prime the generator so the
        # file gets opened right away, before any data is requested.
        with open_file() as fp:
            yield None
            if limit <= 65536:
                yield fp.read(limit)
            else:
                yield from util.filechunkiter(fp, limit=limit)

    def open_index():
        return self.opener(self._indexfile, mode=b"r")

    if self._inline:
        total_size = index_size + data_size
        inline_stream = file_stream(open_index, total_size)
        next(inline_stream)
        return [
            (self._indexfile, inline_stream, total_size),
        ]

    if force_inline:

        def interleaved_stream():
            with self.reading():
                yield None

                for rev in range(count):
                    entry = self.index.entry_binary(rev)
                    if rev == 0 and self._docket is None:
                        # re-inject the inline flag
                        header = (
                            self._format_flags
                            | self._format_version
                            | FLAG_INLINE_DATA
                        )
                        entry = self.index.pack_header(header) + entry
                    yield entry
                    yield self._inner.get_segment_for_revs(rev, rev)[1]

        inline_stream = interleaved_stream()
        next(inline_stream)
        return [
            (self._indexfile, inline_stream, index_size + data_size),
        ]

    index_stream = file_stream(open_index, index_size)
    next(index_stream)
    data_stream = file_stream(self._datafp, data_size)
    next(data_stream)
    return [
        (self._datafile, data_stream, data_size),
        (self._indexfile, index_stream, index_size),
    ]

1674

1675

def _loadindex(self, docket=None):
    """Locate and read the revlog entry point, then parse the index.

    When ``docket`` is provided it is used as is; otherwise the entry
    point file is read, its header is validated, and a docket is created
    or parsed if the detected format uses one.

    This sets the format, file path and parser related attributes on
    ``self`` and returns an ``(index, chunkcache)`` pair. When the Rust
    index is selected, ``index`` is the raw index data and ``chunkcache``
    is ``None``.

    Raises ``error.RevlogError`` for an unknown version, unknown flags,
    truncated index data, or a corrupted index.
    """
    new_header, mmapindexthreshold, force_nodemap = self._init_opts()

    # Select the file the revlog is loaded from.
    if self.postfix is not None:
        entry_point = b'%s.i.%s' % (self.radix, self.postfix)
    elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
        entry_point = b'%s.i.a' % self.radix
    elif self._try_split and self.opener.exists(self._split_index_file):
        entry_point = self._split_index_file
    else:
        entry_point = b'%s.i' % self.radix

    if docket is not None:
        self._docket = docket
        self._docket_file = entry_point
    else:
        self._initempty = True
        entry_data = self._get_data(entry_point, mmapindexthreshold)
        if len(entry_data) > 0:
            header = INDEX_HEADER.unpack(entry_data[:4])[0]
            self._initempty = False
        else:
            # nothing on disk: fall back to the configured default
            header = new_header

        # low 16 bits hold the version, the remaining bits hold the flags
        self._format_flags = header & ~0xFFFF
        self._format_version = header & 0xFFFF

        supported_flags = SUPPORTED_FLAGS.get(self._format_version)
        if supported_flags is None:
            msg = _(b'unknown version (%d) in revlog %s')
            msg %= (self._format_version, self.display_id)
            raise error.RevlogError(msg)
        if self._format_flags & ~supported_flags:
            msg = _(b'unknown flags (%#04x) in version %d revlog %s')
            display_flag = self._format_flags >> 16
            msg %= (display_flag, self._format_version, self.display_id)
            raise error.RevlogError(msg)

        features = FEATURES_BY_VERSION[self._format_version]
        self._inline = features[b'inline'](self._format_flags)
        general_delta = features[b'generaldelta'](self._format_flags)
        self.delta_config.general_delta = general_delta
        self.data_config.generaldelta = self.delta_config.general_delta
        self.feature_config.has_side_data = features[b'sidedata']

        if features[b'docket']:
            self._docket_file = entry_point
            if self._initempty:
                self._docket = docketutil.default_docket(self, header)
            else:
                self._docket = docketutil.parse_docket(
                    self, entry_data, use_pending=self._trypending
                )
        else:
            # the entry point is the index itself
            self._indexfile = entry_point
            index_data = entry_data

    if self._docket is not None:
        self._indexfile = self._docket.index_filepath()
        index_data = b''
        index_size = self._docket.index_end
        if index_size > 0:
            index_data = self._get_data(
                self._indexfile, mmapindexthreshold, size=index_size
            )
            if len(index_data) < index_size:
                msg = _(b'too few index data for %s: got %d, expected %d')
                msg %= (self.display_id, len(index_data), index_size)
                raise error.RevlogError(msg)

        self._inline = False
        # generaldelta implied by version 2 revlogs.
        self.delta_config.general_delta = True
        self.data_config.generaldelta = True
        # the logic for persistent nodemap will be dealt with within the
        # main docket, so disable it for now.
        self._nodemap_file = None

    if self._docket is not None:
        self._datafile = self._docket.data_filepath()
        self._sidedatafile = self._docket.sidedata_filepath()
    elif self.postfix is None:
        self._datafile = b'%s.d' % self.radix
    else:
        self._datafile = b'%s.d.%s' % (self.radix, self.postfix)

    self.nodeconstants = sha1nodeconstants
    self.nullid = self.nodeconstants.nullid

    # sparse-revlog can't be on without general-delta (issue6056)
    if not self.delta_config.general_delta:
        self.delta_config.sparse_revlog = False

    self._storedeltachains = True

    devel_nodemap = (
        self._nodemap_file
        and force_nodemap
        and parse_index_v1_nodemap is not None
    )

    rust_applicable = (
        self._nodemap_file is not None or self.target[0] == KIND_FILELOG
    ) and getattr(self.opener, "rust_compatible", True)

    use_rust_index = False
    if rustrevlog is not None and rust_applicable:
        # we would like to use the rust_index in all cases, especially
        # because it is necessary for AncestorsIterator and LazyAncestors
        # since the 6.7 cycle.
        #
        # However, the performance impact of unconditionally building the
        # nodemap is currently a problem for non-persistent nodemap
        # repository.
        use_rust_index = self._format_version == REVLOGV1

        if hasattr(self.opener, "fncache"):
            vfs = self.opener.vfs
            if not self.opener.uses_dotencode:
                use_rust_index = False
            if not isinstance(vfs, vfsmod.vfs):
                # Be cautious since we don't support other vfs
                use_rust_index = False
        else:
            # Rust only supports repos with fncache
            use_rust_index = False

    # Select the pure/C index parser matching the format version.
    if self._format_version == REVLOGV0:
        self._parse_index = revlogv0.parse_index_v0
    elif self._format_version == REVLOGV2:
        self._parse_index = parse_index_v2
    elif self._format_version == CHANGELOGV2:
        self._parse_index = parse_index_cl_v2
    elif devel_nodemap:
        self._parse_index = parse_index_v1_nodemap
    else:
        self._parse_index = parse_index_v1

    if use_rust_index:
        # Let the Rust code parse its own index
        index, chunkcache = index_data, None
        self.uses_rust = True
    else:
        try:
            index, chunkcache = self._parse_index(index_data, self._inline)
            self._register_nodemap_info(index)
        except (ValueError, IndexError):
            raise error.RevlogError(
                _(b"index %s is corrupted") % self.display_id
            )
    # revnum -> (chain-length, sum-delta-length)
    self._chaininfocache = util.lrucachedict(500)

    return index, chunkcache

1834

1835

def _load_inner(self, index, chunk_cache):
    """Build ``self._inner`` and ``self.index`` from the loaded index.

    ``index`` and ``chunk_cache`` are the values returned by
    ``_loadindex()``. Depending on ``self.uses_rust`` the inner object is
    either a ``rustrevlog.InnerRevlog`` (``index`` is then passed as raw
    index data) or the Python ``_InnerRevlog``.
    """
    docket = self._docket
    default_compression_header = (
        None if docket is None else docket.default_compression_header
    )

    # Arguments accepted by both inner revlog implementations.
    shared_args = dict(
        index_file=self._indexfile,
        data_file=self._datafile,
        sidedata_file=self._sidedatafile,
        inline=self._inline,
        data_config=self.data_config,
        delta_config=self.delta_config,
        feature_config=self.feature_config,
        chunk_cache=chunk_cache,
        default_compression_header=default_compression_header,
    )

    if not self.uses_rust:
        self._inner = _InnerRevlog(
            opener=self.opener,
            index=index,
            **shared_args,
        )
        self.index = self._inner.index
        return

    vfs_is_readonly = False
    fncache = None

    vfs = self.opener
    if hasattr(self.opener, "vfs"):
        # Peel the wrapping layers off to reach the underlying vfs,
        # picking up the fncache on the way.
        if isinstance(vfs, vfsmod.readonlyvfs):
            vfs_is_readonly = True
            vfs = vfs.vfs
        fncache = vfs.fncache
        vfs = vfs.vfs

    vfs_base = vfs.base
    assert fncache is not None, "Rust only supports repos with fncache"

    self._inner = rustrevlog.InnerRevlog(
        vfs_base=vfs_base,
        fncache=fncache,
        vfs_is_readonly=vfs_is_readonly,
        index_data=index,
        revlog_type=self.target[0],
        use_persistent_nodemap=self._nodemap_file is not None,
        **shared_args,
    )
    self.index = RustIndexProxy(self._inner)
    self._register_nodemap_info(self.index)
    self.uses_rust = True

1893

1894

def _register_nodemap_info(self, index):
    """Feed persisted nodemap data to ``index`` when it is usable.

    Nothing happens for inline revlogs, when no nodemap file is
    configured, or when ``index`` has no ``update_nodemap_data`` method.
    The persisted data is only applied if the revision it records as tip
    exists in ``index`` and still carries the recorded node.
    """
    if self._inline:
        return
    if self._nodemap_file is None:
        return
    if not hasattr(index, 'update_nodemap_data'):
        return

    persisted = nodemaputil.persisted_data(self)
    if persisted is None:
        return

    docket = persisted[0]
    tip_matches = (
        len(index) > docket.tip_rev
        and index[docket.tip_rev][7] == docket.tip_node
    )
    if not tip_matches:
        return

    # no changelog tampering
    self._nodemap_docket = docket
    index.update_nodemap_data(*persisted)  # pytype: disable=attribute-error

1913

1914

def get_revlog(self):
    """Return this object itself.

    Simple accessor mirroring the API of other not-really-revlog objects.
    """
    revlog = self
    return revlog

1917

1918

@util.propertycache
def revlog_kind(self):
    """The kind of this revlog: the first item of ``self.target``."""
    kind = self.target[0]
    return kind

1921

1922

@util.propertycache
def display_id(self):
    """The public facing "ID" of the revlog that we use in messages."""
    if self.revlog_kind != KIND_FILELOG:
        return self.radix
    # Reference the file without the "data/" prefix, so it is familiar
    # to the user.
    return self.target[1]

1931

1932

def _datafp(self, mode=b'r'):
    """Open the revlog's data file with ``mode`` and return the result."""
    data_path = self._datafile
    return self.opener(data_path, mode=mode)

1935

1936

def tiprev(self):
    """Return the last revision number in the index (-1 when empty)."""
    revision_count = len(self.index)
    return revision_count - 1

1938

1939

def tip(self):
    """Return the node of the tip revision (see ``tiprev()``)."""
    last_rev = self.tiprev()
    return self.node(last_rev)

1941

1942

def __contains__(self, rev):
    """Tell whether ``rev`` is a valid revision number for this revlog."""
    upper_bound = len(self)
    return 0 <= rev < upper_bound

1944

1945

def __len__(self):
    """Return the number of entries in the index."""
    index = self.index
    return len(index)

1947

1948

def __iter__(self) -> Iterator[int]:
    """Iterate over every revision number, from 0 to ``len(self) - 1``."""
    all_revs = range(len(self))
    return iter(all_revs)

1950

1951

def revs(self, start=0, stop=None):
    """Iterate over the revisions of this revlog, from start to stop.

    The iteration itself is delegated to ``storageutil.iterrevs``.
    """
    total = len(self)
    return storageutil.iterrevs(total, start=start, stop=stop)

1954

1955

def hasnode(self, node):
    """Tell whether ``node`` is known, i.e. ``self.rev(node)`` succeeds.

    A ``KeyError`` raised by the lookup is reported as ``False``.
    """
    try:
        self.rev(node)
    except KeyError:
        return False
    else:
        return True

1961

1962

def _candelta(self, baserev, rev):
    """Tell whether the two revisions (baserev, rev) may be delta-ed.

    Returns False as soon as either revision carries one of the
    ``REVIDX_RAWTEXT_CHANGING_FLAGS``, True otherwise.
    """
    # A content-changing flag processor (ex. LFS) can alter the rawtext
    # that a delta would be based on. Two clients could then hold the same
    # revlog node with different flags (i.e. different rawtext contents),
    # making the delta incompatible, so deltas are disabled for such revs.
    mask = REVIDX_RAWTEXT_CHANGING_FLAGS
    blocked = (self.flags(baserev) & mask) or (self.flags(rev) & mask)
    return not blocked

1974

1975

def update_caches(self, transaction):
    """Update the on-disk cache.

    Nothing happens when the revlog has no nodemap file. Otherwise the
    persistent nodemap is updated right away when ``transaction`` is None,
    and set up through the transaction when one is passed (so the update
    may be delayed to transaction commit).
    """
    if self._nodemap_file is None:
        return
    if transaction is None:
        nodemaputil.update_persistent_nodemap(self)
        return
    nodemaputil.setup_persistent_nodemap(transaction, self)

1985

1986

def clearcaches(self, clear_persisted_data: bool = False) -> None:
    """Clear in-memory caches.

    Resets the chain-base cache, the inner object's cache, ``_pcache``,
    the nodemap docket and the index caches. ``clear_persisted_data`` is
    accepted but not consulted by this method body.
    """
    self._chainbasecache.clear()
    self._inner.clear_cache()
    self._pcache = {}
    self._nodemap_docket = None
    self.index.clearcaches()

    # The python code is the one responsible for validating the docket, we
    # end up having to refresh it here. That only applies to non-inline
    # revlogs that have a nodemap file and an index able to take the data.
    if self._inline:
        return
    if self._nodemap_file is None:
        return
    if not hasattr(self.index, 'update_nodemap_data'):
        return

    nodemap_data = nodemaputil.persisted_data(self)
    if nodemap_data is None:
        return
    self._nodemap_docket = nodemap_data[0]
    self.index.update_nodemap_data(
        *nodemap_data
    )  # pytype: disable=attribute-error

2007

2008

def rev(self, node):
    """Return the revision number associated with a <nodeid>.

    Raises ``error.WdirUnsupported`` when the index lookup fails for one of
    the working-directory pseudo ids, and ``error.LookupError`` when it
    fails for any other node. A ``TypeError`` from the index is re-raised
    untouched.
    """
    try:
        return self.index.rev(node)
    except TypeError:
        raise
    except error.RevlogError:
        # parsers.c radix tree lookup failed
        constants = self.nodeconstants
        is_wdir = (
            node == constants.wdirid or node in constants.wdirfilenodeids
        )
        if is_wdir:
            raise error.WdirUnsupported
        raise error.LookupError(node, self.display_id, _(b'no node'))

2022

2023

# Accessors for index entries.

2023

# Accessors for index entries.

2024

2025

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

2025

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

2026

# are flags.

2026

# are flags.

2027

def start(self, rev):
    """Return the offset part of the first index field of ``rev``.

    The low 16 bits of that field hold the flags, so they are shifted out.
    """
    offset_and_flags = self.index[rev][0]
    return int(offset_and_flags >> 16)

2029

2030

def sidedata_cut_off(self, rev):
    """Return the sidedata cut-off position for ``rev``.

    This is the sidedata offset recorded for ``rev`` (index field 8) when
    it is non-zero. Otherwise it is the end (offset + length) of the
    sidedata of the closest revision at or before ``rev`` whose sidedata
    length (index field 9) is non-zero, or 0 when there is none.
    """
    index = self.index
    own_offset = index[rev][8]
    if own_offset != 0:
        return own_offset
    # This is some annoying dance, because entries without sidedata
    # currently use 0 as their offset (instead of previous-offset +
    # previous-size).
    #
    # We should reconsider this "no sidedata -> 0 sidedata_offset" policy.
    # In the meantime, we need this.
    for candidate in range(rev, -1, -1):
        entry = index[candidate]
        if entry[9] != 0:
            return entry[8] + entry[9]
    return 0

2046

2047

def flags(self, rev):
    """Return the flags of ``rev``: the low 16 bits of index field 0."""
    flag_mask = 0xFFFF
    return self.index[rev][0] & flag_mask

2049

2050

def length(self, rev):
    """Return index field 1 of ``rev``, the length stored for it."""
    entry = self.index[rev]
    return entry[1]

2052

2053

def sidedata_length(self, rev):
    """Return the sidedata length of ``rev`` (index field 9).

    Always 0 when the revlog's feature config reports no side data.
    """
    if self.feature_config.has_side_data:
        return self.index[rev][9]
    return 0

2057

2058

def rawsize(self, rev):
    """Return the length of the uncompressed text for a given revision.

    The size stored in index field 2 is used when it is not negative;
    otherwise the raw data is fetched and measured.
    """
    stored = self.index[rev][2]
    if stored < 0:
        return len(self.rawdata(rev))
    return stored

2066

2067

def size(self, rev):
    """Return the length of non-raw text (processed by a "read" flag
    processor)."""
    flags = self.flags(rev)
    # Every known flag except ELLIPSIS, which is known to not change the
    # content.
    content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
    if flags & content_changing:
        return len(self.revision(rev))
    # fast path: no "read" flag processor could change the content, so
    # size is rawsize.
    return self.rawsize(rev)

2076

2077

def fast_rank(self, rev):
    """Return the rank of a revision if already known, or None otherwise.

    The rank of a revision is the size of the sub-graph it defines as a
    head. Equivalently, the rank of a revision `r` is the size of the set
    `ancestors(r)`, `r` included.

    The value is read straight from the index, in constant time. No
    attempt is made to compute unknown values for versions of the revlog
    which do not persist the rank.
    """
    rank = self.index[rev][ENTRY_RANK]
    if self._format_version != CHANGELOGV2:
        return None
    if rank == RANK_UNKNOWN:
        return None
    if rev == nullrev:
        return 0  # convention
    return rank

2094

2095

def chainbase(self, rev):
    """Return the revision at the bottom of the base chain of ``rev``.

    Index field 3 is followed from ``rev`` until an entry names itself as
    its own base. The answer is memoized in ``self._chainbasecache``.
    """
    cache = self._chainbasecache
    cached = cache.get(rev)
    if cached is not None:
        return cached

    index = self.index
    current = rev
    while True:
        base = index[current][3]
        if base == current:
            break
        current = base

    cache[rev] = base
    return base

2109

2110

def linkrev(self, rev):
    """Return index field 4 of ``rev``, its linkrev."""
    entry = self.index[rev]
    return entry[4]

2112

2113

def parentrevs(self, rev):
    """Return the two parent revision numbers of ``rev``.

    With ``canonical_parent_order`` enabled, a null first parent is moved
    to the second position. An ``IndexError`` on the index lookup becomes
    ``error.WdirUnsupported`` when ``rev`` is the working-directory
    revision, and is re-raised otherwise.
    """
    try:
        entry = self.index[rev]
    except IndexError:
        if rev != wdirrev:
            raise
        raise error.WdirUnsupported

    p1, p2 = entry[5], entry[6]
    if self.feature_config.canonical_parent_order and p1 == nullrev:
        return p2, p1
    return p1, p2


# fast parentrevs(rev) where rev isn't filtered
_uncheckedparentrevs = parentrevs

2128

2129

def node(self, rev):
    """Return the node of ``rev`` (index field 7).

    An ``IndexError`` becomes ``error.WdirUnsupported`` when ``rev`` is the
    working-directory revision, and is re-raised otherwise.
    """
    try:
        return self.index[rev][7]
    except IndexError:
        if rev != wdirrev:
            raise
        raise error.WdirUnsupported

2136

2137

# Derived from index values.

2137

# Derived from index values.

2138

2139

def end(self, rev):
    """Return ``start(rev) + length(rev)``."""
    begin = self.start(rev)
    return begin + self.length(rev)

2141

2142

def parents(self, node):
    """Return the two parent nodes of ``node``.

    With ``canonical_parent_order`` enabled, a null first parent is moved
    to the second position, mirroring what ``parentrevs`` does for
    revision numbers.

    Raises whatever ``self.rev(node)`` raises for an unknown node.
    """
    i = self.index
    d = i[self.rev(node)]
    # inline node() to avoid function call overhead
    p1node = i[d[5]][7]
    p2node = i[d[6]][7]
    # d[5] is a revision number, so it must not be compared with the
    # ``nullid`` node directly (that test could never succeed); compare
    # the first parent's node instead.
    if self.feature_config.canonical_parent_order and p1node == self.nullid:
        return p2node, p1node
    return p1node, p2node

2150

2151

def chainlen(self, rev):
    """Return the first item of ``_chaininfo(rev)``: the chain length."""
    info = self._chaininfo(rev)
    return info[0]

2153

2154

def _chaininfo(self, rev):
    """Return ``(chain length, compressed delta length)`` for ``rev``.

    The chain is walked down from ``rev`` until an entry that is its own
    base (index field 3) or until a revision already present in
    ``self._chaininfocache`` is met. With general delta the walk follows
    the recorded base; otherwise it steps to the previous revision. The
    result is memoized in the cache.
    """
    cache = self._chaininfocache
    if rev in cache:
        return cache[rev]

    index = self.index
    follow_base = self.delta_config.general_delta
    current = rev
    entry = index[current]
    chain_len = 0
    delta_bytes = 0
    while True:
        if current == entry[3]:
            # Add text length of base since decompressing that also takes
            # work. For cache hits the length is already included.
            delta_bytes += entry[1]
            break
        chain_len += 1
        delta_bytes += entry[1]
        if follow_base:
            current = entry[3]
        else:
            current -= 1
        if current in cache:
            known = cache[current]
            chain_len += known[0]
            delta_bytes += known[1]
            break
        entry = index[current]

    result = (chain_len, delta_bytes)
    cache[rev] = result
    return result

2184

2185

def _deltachain(self, rev, stoprev=None):
    """Forward to ``self._inner._deltachain`` with the same arguments."""
    inner = self._inner
    return inner._deltachain(rev, stoprev=stoprev)

2187

2188

def ancestors(self, revs, stoprev=0, inclusive=False):
    """Generate the ancestors of 'revs' in reverse revision order.
    Does not generate revs lower than stoprev.

    See the documentation for ancestor.lazyancestors for more details."""

    # first, make sure start revisions aren't filtered
    revs = list(revs)
    validate = self.node
    for start_rev in revs:
        validate(start_rev)
    # and we're sure ancestors aren't filtered as well

    use_rust = rustancestor is not None and self.index.rust_ext_compat
    if use_rust:
        factory = rustancestor.LazyAncestors
        source = self.index
    else:
        factory = ancestor.lazyancestors
        source = self._uncheckedparentrevs
    return factory(source, revs, stoprev=stoprev, inclusive=inclusive)

2208

2209

def descendants(self, revs):
    """Delegate to ``dagop.descendantrevs``.

    It receives ``revs`` together with this revlog's ``revs`` and
    ``parentrevs`` methods.
    """
    compute = dagop.descendantrevs
    return compute(revs, self.revs, self.parentrevs)

2211

2212

def findcommonmissing(self, common=None, heads=None):
    """Return a tuple of the ancestors of common and the ancestors of heads
    that are not ancestors of common. In revset terminology, we return the
    tuple:

      ::common, (::heads) - (::common)

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs. If heads is
    not supplied, uses all of the revlog's heads. If common is not
    supplied, uses nullid."""
    if common is None:
        common = [self.nullid]
    if heads is None:
        heads = self.heads()

    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    # we want the ancestors, but inclusive
    class lazyset:
        """Set-like view: eagerly added values on top of a lazy iterable."""

        def __init__(self, lazyvalues):
            self.addedvalues = set()
            self.lazyvalues = lazyvalues

        def __contains__(self, value):
            if value in self.addedvalues:
                return True
            return value in self.lazyvalues

        def __iter__(self):
            added = self.addedvalues
            yield from added
            for r in self.lazyvalues:
                if r not in added:
                    yield r

        def add(self, value):
            self.addedvalues.add(value)

        def update(self, values):
            self.addedvalues.update(values)

    has = lazyset(self.ancestors(common))
    has.add(nullrev)
    has.update(common)

    # take all ancestors from heads that aren't in has
    missing = set()
    visit = collections.deque(r for r in heads if r not in has)
    while visit:
        r = visit.popleft()
        if r in missing:
            continue
        missing.add(r)
        for p in self.parentrevs(r):
            if p not in has:
                visit.append(p)
    return has, [self.node(miss) for miss in sorted(missing)]

2275

2276

def incrementalmissingrevs(self, common=None):
    """Return an object that can be used to incrementally compute the
    revision numbers of the ancestors of arbitrary sets that are not
    ancestors of common.

    The object is a ``rustancestor.MissingAncestors`` when the Rust
    module is available and the index is compatible with it, and an
    ``ancestor.incrementalmissingancestors`` otherwise.

    'common' is a list of revision numbers. If common is not supplied, uses
    nullrev.
    """
    if common is None:
        common = [nullrev]

    if rustancestor is None or not self.index.rust_ext_compat:
        return ancestor.incrementalmissingancestors(self.parentrevs, common)
    return rustancestor.MissingAncestors(self.index, common)

2291

2292

def findmissingrevs(self, common=None, heads=None):
    """Return the revision numbers of the ancestors of heads that
    are not ancestors of common.

    More specifically, return a list of revision numbers corresponding to
    nodes N such that every N satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of revision numbers. If heads is
    not supplied, uses all of the revlog's head revisions. If common is
    not supplied, uses nullrev."""
    common_revs = [nullrev] if common is None else common
    head_revs = self.headrevs() if heads is None else heads

    tracker = self.incrementalmissingrevs(common=common_revs)
    return tracker.missingancestors(head_revs)

2315

2316

def findmissing(self, common=None, heads=None):
    """Return the ancestors of heads that are not ancestors of common.

    More specifically, return a list of nodes N such that every N
    satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs. If heads is
    not supplied, uses all of the revlog's heads. If common is not
    supplied, uses nullid."""
    common_nodes = [self.nullid] if common is None else common
    head_nodes = self.heads() if heads is None else heads

    # The incremental helper works on revision numbers, not nodes.
    common_revs = [self.rev(n) for n in common_nodes]
    head_revs = [self.rev(n) for n in head_nodes]

    tracker = self.incrementalmissingrevs(common=common_revs)
    return [self.node(r) for r in tracker.missingancestors(head_revs)]

2341

2342

def nodesbetween(self, roots=None, heads=None):

2342

def nodesbetween(self, roots=None, heads=None):

2343

"""Return a topological path from 'roots' to 'heads'.

2343

"""Return a topological path from 'roots' to 'heads'.

2344

2345

Return a tuple (nodes, outroots, outheads) where 'nodes' is a

2345

Return a tuple (nodes, outroots, outheads) where 'nodes' is a

2346

topologically sorted list of all nodes N that satisfy both of

2346

topologically sorted list of all nodes N that satisfy both of

2347

these constraints:

2347

these constraints:

2348

2349

1. N is a descendant of some node in 'roots'

2349

1. N is a descendant of some node in 'roots'

2350

2. N is an ancestor of some node in 'heads'

2350

2. N is an ancestor of some node in 'heads'

2351

2352

Every node is considered to be both a descendant and an ancestor

2352

Every node is considered to be both a descendant and an ancestor

2353

of itself, so every reachable node in 'roots' and 'heads' will be

2353

of itself, so every reachable node in 'roots' and 'heads' will be

2354

included in 'nodes'.

2354

included in 'nodes'.

2355

2356

'outroots' is the list of reachable nodes in 'roots', i.e., the

2356

'outroots' is the list of reachable nodes in 'roots', i.e., the

2357

subset of 'roots' that is returned in 'nodes'. Likewise,

2357

subset of 'roots' that is returned in 'nodes'. Likewise,

2358

'outheads' is the subset of 'heads' that is also in 'nodes'.

2358

'outheads' is the subset of 'heads' that is also in 'nodes'.

2359

2360

'roots' and 'heads' are both lists of node IDs. If 'roots' is

2360

'roots' and 'heads' are both lists of node IDs. If 'roots' is

2361

unspecified, uses nullid as the only root. If 'heads' is

2361

unspecified, uses nullid as the only root. If 'heads' is

2362

unspecified, uses list of all of the revlog's heads."""

2362

unspecified, uses list of all of the revlog's heads."""

2363

nonodes = ([], [], [])

2363

nonodes = ([], [], [])

2364

if roots is not None:

2364

if roots is not None:

2365

roots = list(roots)

2365

roots = list(roots)

2366

if not roots:

2366

if not roots:

2367

return nonodes

2367

return nonodes

2368

lowestrev = min([self.rev(n) for n in roots])

2368

lowestrev = min([self.rev(n) for n in roots])

2369

else:

2369

else:

2370

roots = [self.nullid] # Everybody's a descendant of nullid

2370

roots = [self.nullid] # Everybody's a descendant of nullid

2371

lowestrev = nullrev

2371

lowestrev = nullrev

2372

if (lowestrev == nullrev) and (heads is None):

2372

if (lowestrev == nullrev) and (heads is None):

2373

# We want _all_ the nodes!

2373

# We want _all_ the nodes!

2374

return (

2374

return (

2375

[self.node(r) for r in self],

2375

[self.node(r) for r in self],

2376

[self.nullid],

2376

[self.nullid],

2377

list(self.heads()),

2377

list(self.heads()),

2378

)

2378

)

2379

if heads is None:

2379

if heads is None:

2380

# All nodes are ancestors, so the latest ancestor is the last

2380

# All nodes are ancestors, so the latest ancestor is the last

2381

# node.

2381

# node.

2382

highestrev = len(self) - 1

2382

highestrev = len(self) - 1

2383

# Set ancestors to None to signal that every node is an ancestor.

2383

# Set ancestors to None to signal that every node is an ancestor.

2384

ancestors = None

2384

ancestors = None

2385

# Set heads to an empty dictionary for later discovery of heads

2385

# Set heads to an empty dictionary for later discovery of heads

2386

heads = {}

2386

heads = {}

2387

else:

2387

else:

2388

heads = list(heads)

2388

heads = list(heads)

2389

if not heads:

2389

if not heads:

2390

return nonodes

2390

return nonodes

2391

ancestors = set()

2391

ancestors = set()

2392

# Turn heads into a dictionary so we can remove 'fake' heads.

2392

# Turn heads into a dictionary so we can remove 'fake' heads.

2393

# Also, later we will be using it to filter out the heads we can't

2393

# Also, later we will be using it to filter out the heads we can't

2394

# find from roots.

2394

# find from roots.

2395

heads = dict.fromkeys(heads, False)

2395

heads = dict.fromkeys(heads, False)

2396

# Start at the top and keep marking parents until we're done.

2396

# Start at the top and keep marking parents until we're done.

2397

nodestotag = set(heads)

2397

nodestotag = set(heads)

2398

# Remember where the top was so we can use it as a limit later.

2398

# Remember where the top was so we can use it as a limit later.

2399

highestrev = max([self.rev(n) for n in nodestotag])

2399

highestrev = max([self.rev(n) for n in nodestotag])

2400

while nodestotag:

2400

while nodestotag:

2401

# grab a node to tag

2401

# grab a node to tag

2402

n = nodestotag.pop()

2402

n = nodestotag.pop()

2403

# Never tag nullid

2403

# Never tag nullid

2404

if n == self.nullid:

2404

if n == self.nullid:

2405

continue

2405

continue

2406

# A node's revision number represents its place in a

2406

# A node's revision number represents its place in a

2407

# topologically sorted list of nodes.

2407

# topologically sorted list of nodes.

2408

r = self.rev(n)

2408

r = self.rev(n)

2409

if r >= lowestrev:

2409

if r >= lowestrev:

2410

if n not in ancestors:

2410

if n not in ancestors:

2411

# If we are possibly a descendant of one of the roots

2411

# If we are possibly a descendant of one of the roots

2412

# and we haven't already been marked as an ancestor

2412

# and we haven't already been marked as an ancestor

2413

ancestors.add(n) # Mark as ancestor

2413

ancestors.add(n) # Mark as ancestor

2414

# Add non-nullid parents to list of nodes to tag.

2414

# Add non-nullid parents to list of nodes to tag.

2415

nodestotag.update(

2415

nodestotag.update(

2416

[p for p in self.parents(n) if p != self.nullid]

2416

[p for p in self.parents(n) if p != self.nullid]

2417

)

2417

)

2418

elif n in heads: # We've seen it before, is it a fake head?

2418

elif n in heads: # We've seen it before, is it a fake head?

2419

# So it is, real heads should not be the ancestors of

2419

# So it is, real heads should not be the ancestors of

2420

# any other heads.

2420

# any other heads.

2421

heads.pop(n)

2421

heads.pop(n)

2422

if not ancestors:

2422

if not ancestors:

2423

return nonodes

2423

return nonodes

2424

# Now that we have our set of ancestors, we want to remove any

2424

# Now that we have our set of ancestors, we want to remove any

2425

# roots that are not ancestors.

2425

# roots that are not ancestors.

2426

2427

# If one of the roots was nullid, everything is included anyway.

2427

# If one of the roots was nullid, everything is included anyway.

2428

if lowestrev > nullrev:

2428

if lowestrev > nullrev:

2429

# But, since we weren't, let's recompute the lowest rev to not

2429

# But, since we weren't, let's recompute the lowest rev to not

2430

# include roots that aren't ancestors.

2430

# include roots that aren't ancestors.

2431

2432

# Filter out roots that aren't ancestors of heads

2432

# Filter out roots that aren't ancestors of heads

2433

roots = [root for root in roots if root in ancestors]

2433

roots = [root for root in roots if root in ancestors]

2434

# Recompute the lowest revision

2434

# Recompute the lowest revision

2435

if roots:

2435

if roots:

2436

lowestrev = min([self.rev(root) for root in roots])

2436

lowestrev = min([self.rev(root) for root in roots])

2437

else:

2437

else:

2438

# No more roots? Return empty list

2438

# No more roots? Return empty list

2439

return nonodes

2439

return nonodes

2440

else:

2440

else:

2441

# We are descending from nullid, and don't need to care about

2441

# We are descending from nullid, and don't need to care about

2442

# any other roots.

2442

# any other roots.

2443

lowestrev = nullrev

2443

lowestrev = nullrev

2444

roots = [self.nullid]

2444

roots = [self.nullid]

2445

# Transform our roots list into a set.

2445

# Transform our roots list into a set.

2446

descendants = set(roots)

2446

descendants = set(roots)

2447

# Also, keep the original roots so we can filter out roots that aren't

2447

# Also, keep the original roots so we can filter out roots that aren't

2448

# 'real' roots (i.e. are descended from other roots).

2448

# 'real' roots (i.e. are descended from other roots).

2449

roots = descendants.copy()

2449

roots = descendants.copy()

2450

# Our topologically sorted list of output nodes.

2450

# Our topologically sorted list of output nodes.

2451

orderedout = []

2451

orderedout = []

2452

# Don't start at nullid since we don't want nullid in our output list,

2452

# Don't start at nullid since we don't want nullid in our output list,

2453

# and if nullid shows up in descendants, empty parents will look like

2453

# and if nullid shows up in descendants, empty parents will look like

2454

# they're descendants.

2454

# they're descendants.

2455

for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):

2455

for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):

2456

n = self.node(r)

2456

n = self.node(r)

2457

isdescendant = False

2457

isdescendant = False

2458

if lowestrev == nullrev: # Everybody is a descendant of nullid

2458

if lowestrev == nullrev: # Everybody is a descendant of nullid

2459

isdescendant = True

2459

isdescendant = True

2460

elif n in descendants:

2460

elif n in descendants:

2461

# n is already a descendant

2461

# n is already a descendant

2462

isdescendant = True

2462

isdescendant = True

2463

# This check only needs to be done here because all the roots

2463

# This check only needs to be done here because all the roots

2464

# will start being marked is descendants before the loop.

2464

# will start being marked is descendants before the loop.

2465

if n in roots:

2465

if n in roots:

2466

# If n was a root, check if it's a 'real' root.

2466

# If n was a root, check if it's a 'real' root.

2467

p = tuple(self.parents(n))

2467

p = tuple(self.parents(n))

2468

# If any of its parents are descendants, it's not a root.

2468

# If any of its parents are descendants, it's not a root.

2469

if (p[0] in descendants) or (p[1] in descendants):

2469

if (p[0] in descendants) or (p[1] in descendants):

2470

roots.remove(n)

2470

roots.remove(n)

2471

else:

2471

else:

2472

p = tuple(self.parents(n))

2472

p = tuple(self.parents(n))

2473

# A node is a descendant if either of its parents are

2473

# A node is a descendant if either of its parents are

2474

# descendants. (We seeded the dependents list with the roots

2474

# descendants. (We seeded the dependents list with the roots

2475

# up there, remember?)

2475

# up there, remember?)

2476

if (p[0] in descendants) or (p[1] in descendants):

2476

if (p[0] in descendants) or (p[1] in descendants):

2477

descendants.add(n)

2477

descendants.add(n)

2478

isdescendant = True

2478

isdescendant = True

2479

if isdescendant and ((ancestors is None) or (n in ancestors)):

2479

if isdescendant and ((ancestors is None) or (n in ancestors)):

2480

# Only include nodes that are both descendants and ancestors.

2480

# Only include nodes that are both descendants and ancestors.

2481

orderedout.append(n)

2481

orderedout.append(n)

2482

if (ancestors is not None) and (n in heads):

2482

if (ancestors is not None) and (n in heads):

2483

# We're trying to figure out which heads are reachable

2483

# We're trying to figure out which heads are reachable

2484

# from roots.

2484

# from roots.

2485

# Mark this head as having been reached

2485

# Mark this head as having been reached

2486

heads[n] = True

2486

heads[n] = True

2487

elif ancestors is None:

2487

elif ancestors is None:

2488

# Otherwise, we're trying to discover the heads.

2488

# Otherwise, we're trying to discover the heads.

2489

# Assume this is a head because if it isn't, the next step

2489

# Assume this is a head because if it isn't, the next step

2490

# will eventually remove it.

2490

# will eventually remove it.

2491

heads[n] = True

2491

heads[n] = True

2492

# But, obviously its parents aren't.

2492

# But, obviously its parents aren't.

2493

for p in self.parents(n):

2493

for p in self.parents(n):

2494

heads.pop(p, None)

2494

heads.pop(p, None)

2495

heads = [head for head, flag in heads.items() if flag]

2495

heads = [head for head, flag in heads.items() if flag]

2496

roots = list(roots)

2496

roots = list(roots)

2497

assert orderedout

2497

assert orderedout

2498

assert roots

2498

assert roots

2499

assert heads

2499

assert heads

2500

return (orderedout, roots, heads)

2500

return (orderedout, roots, heads)

2501

2502

def headrevs(self, revs=None, stop_rev=None):
    """Return the head revisions of the revlog or of a subset of it.

    With ``revs`` left as None the request is handed to the index, with
    ``stop_rev`` forwarded unchanged. When ``revs`` is given, the heads of
    that subset are computed by ``rustdagop`` if it is available and the
    index reports ``rust_ext_compat``, and by ``dagop`` otherwise;
    ``stop_rev`` is not used on that path.
    """
    if revs is not None:
        use_rust = rustdagop is not None and self.index.rust_ext_compat
        if use_rust:
            return rustdagop.headrevs(self.index, revs)
        return dagop.headrevs(revs, self._uncheckedparentrevs)
    return self.index.headrevs(None, stop_rev)

2508

2509

def headrevsdiff(self, start, stop):
    """Return what the index (or ``dagop``) computes as the head diff.

    The index implementation is preferred. If an ``AttributeError`` is
    raised while using it (for instance because the index has no
    ``headrevsdiff``), ``dagop.headrevsdiff`` is used instead.
    """
    try:
        index_diff = self.index.headrevsdiff  # pytype: disable=attribute-error
        return index_diff(start, stop)
    except AttributeError:
        return dagop.headrevsdiff(self._uncheckedparentrevs, start, stop)

2516

2517

def computephases(self, roots):
    """Delegate to the index's ``computephasesmapsets`` for ``roots``."""
    index = self.index
    return index.computephasesmapsets(roots)  # pytype: disable=attribute-error

2521

2522

def _head_node_ids(self):

2522

def _head_node_ids(self):

2523

try:

2523

try:

2524

return self.index.head_node_ids() # pytype: disable=attribute-error

2524

return self.index.head_node_ids() # pytype: disable=attribute-error

2525

except AttributeError:

2525

except AttributeError:

2526

return [self.node(r) for r in self.headrevs()]

2526

return [self.node(r) for r in self.headrevs()]

2527

2528

def heads(self, start=None, stop=None):
    """return the list of all nodes that have no children

    if start is specified, only heads that are descendants of
    start will be returned
    if stop is specified, it will consider all the revs from stop
    as if they had no children
    """
    if start is None and stop is None:
        # unrestricted query: an empty revlog only has the null node
        return self._head_node_ids() if len(self) else [self.nullid]

    startrev = nullrev if start is None else self.rev(start)

    stoprevs = set()
    for stopnode in stop or []:
        stoprevs.add(self.rev(stopnode))

    headrevs = dagop.headrevssubset(
        self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
    )
    return [self.node(rev) for rev in headrevs]

2552

2553

def diffheads(self, start, stop):
    """return the nodes that make up the difference between
    heads of revs before `start` and heads of revs before `stop`

    The result is a ``(removed, added)`` pair of node lists, converted
    from the revision numbers given by ``headrevsdiff``.
    """
    gone_revs, new_revs = self.headrevsdiff(start, stop)
    gone_nodes = [self.node(rev) for rev in gone_revs]
    new_nodes = [self.node(rev) for rev in new_revs]
    return gone_nodes, new_nodes

2558

2559

def children(self, node):
    """find the children of a given node"""
    found = []
    parentrev = self.rev(node)
    # children can only live after their parent in the revlog
    for rev in self.revs(start=parentrev + 1):
        realparents = [pr for pr in self.parentrevs(rev) if pr != nullrev]
        if not realparents:
            # a revision without real parents is a child of null only
            if parentrev == nullrev:
                found.append(self.node(rev))
            continue
        for pr in realparents:
            if pr == parentrev:
                found.append(self.node(rev))
    return found

2572

2573

def commonancestorsheads(self, a, b):
    """calculate all the heads of the common ancestors of nodes a and b"""
    rev_a, rev_b = self.rev(a), self.rev(b)
    head_revs = self._commonancestorsheads(rev_a, rev_b)
    # convert the revision numbers back to nodes
    return pycompat.maplist(self.node, head_revs)

2578

2579

def _commonancestorsheads(self, *revs):

2579

def _commonancestorsheads(self, *revs):

2580

"""calculate all the heads of the common ancestors of revs"""

2580

"""calculate all the heads of the common ancestors of revs"""

2581

try:

2581

try:

2582

ancs = self.index.commonancestorsheads(

2582

ancs = self.index.commonancestorsheads(

2583

*revs

2583

*revs

2584

) # pytype: disable=attribute-error

2584

) # pytype: disable=attribute-error

2585

except (AttributeError, OverflowError): # C implementation failed

2585

except (AttributeError, OverflowError): # C implementation failed

2586

ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)

2586

ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)

2587

return ancs

2587

return ancs

2588

2589

def isancestor(self, a, b):
    """return True if node a is an ancestor of node b

    A revision is considered an ancestor of itself."""
    rev_a = self.rev(a)
    rev_b = self.rev(b)
    return self.isancestorrev(rev_a, rev_b)

2595

2596

def isancestorrev(self, a, b):
    """return True if revision a is an ancestor of revision b

    A revision is considered an ancestor of itself.

    The implementation of this is trivial but the use of
    reachableroots is not."""
    if a == nullrev or a == b:
        # null is an ancestor of everything, and a rev of itself
        return True
    if a > b:
        # an ancestor never has a higher revision number
        return False
    reached = self.reachableroots(a, [b], [a], includepath=False)
    return bool(reached)

2610

2611

def reachableroots(self, minroot, heads, roots, includepath=False):
    """return (heads(::(<roots> and <roots>::<heads>)))

    If includepath is True, return (<roots>::<heads>).

    The index's ``reachableroots2`` is used when available; on
    ``AttributeError`` the ``dagop._reachablerootspure`` helper is used
    (note that it takes ``roots`` before ``heads``).
    """
    try:
        index_impl = self.index.reachableroots2  # pytype: disable=attribute-error
        return index_impl(minroot, heads, roots, includepath)
    except AttributeError:
        return dagop._reachablerootspure(
            self.parentrevs, minroot, roots, heads, includepath
        )

2623

2624

def ancestor(self, a, b):
    """calculate the "best" common ancestor of nodes a and b

    Returns ``self.nullid`` when no common ancestor is reported.
    """
    rev_a, rev_b = self.rev(a), self.rev(b)
    try:
        candidates = self.index.ancestors(
            rev_a, rev_b
        )  # pytype: disable=attribute-error
    except (AttributeError, OverflowError):
        candidates = ancestor.ancestors(self.parentrevs, rev_a, rev_b)
    if not candidates:
        return self.nullid
    # choose a consistent winner when there's a tie
    return min(map(self.node, candidates))

2636

2637

def _match(self, id):

2637

def _match(self, id):

2638

if isinstance(id, int):

2638

if isinstance(id, int):

2639

# rev

2639

# rev

2640

return self.node(id)

2640

return self.node(id)

2641

if len(id) == self.nodeconstants.nodelen:

2641

if len(id) == self.nodeconstants.nodelen:

2642

# possibly a binary node

2642

# possibly a binary node

2643

# odds of a binary node being all hex in ASCII are 1 in 10**25

2643

# odds of a binary node being all hex in ASCII are 1 in 10**25

2644

try:

2644

try:

2645

node = id

2645

node = id

2646

self.rev(node) # quick search the index

2646

self.rev(node) # quick search the index

2647

return node

2647

return node

2648

except error.LookupError:

2648

except error.LookupError:

2649

pass # may be partial hex id

2649

pass # may be partial hex id

2650

try:

2650

try:

2651

# str(rev)

2651

# str(rev)

2652

rev = int(id)

2652

rev = int(id)

2653

if b"%d" % rev != id:

2653

if b"%d" % rev != id:

2654

raise ValueError

2654

raise ValueError

2655

if rev < 0:

2655

if rev < 0:

2656

rev = len(self) + rev

2656

rev = len(self) + rev

2657

if rev < 0 or rev >= len(self):

2657

if rev < 0 or rev >= len(self):

2658

raise ValueError

2658

raise ValueError

2659

return self.node(rev)

2659

return self.node(rev)

2660

except (ValueError, OverflowError):

2660

except (ValueError, OverflowError):

2661

pass

2661

pass

2662

if len(id) == 2 * self.nodeconstants.nodelen:

2662

if len(id) == 2 * self.nodeconstants.nodelen:

2663

try:

2663

try:

2664

# a full hex nodeid?

2664

# a full hex nodeid?

2665

node = bin(id)

2665

node = bin(id)

2666

self.rev(node)

2666

self.rev(node)

2667

return node

2667

return node

2668

except (binascii.Error, error.LookupError):

2668

except (binascii.Error, error.LookupError):

2669

pass

2669

pass

2670

2671

def _partialmatch(self, id):
    """Resolve a hex prefix ``id`` to a node.

    The index's ``partialmatch`` is consulted first, then the
    ``_pcache`` prefix cache, and finally a scan over the whole index.
    Returns the node, or None when there is no match. Raises
    ``AmbiguousPrefixLookupError`` when the prefix is ambiguous and
    ``WdirUnsupported`` when the prefix can only designate the working
    directory id.
    """
    # we don't care wdirfilenodeids as they should be always full hash
    maybewdir = self.nodeconstants.wdirhex.startswith(id)
    ambiguous = False
    try:
        partial = self.index.partialmatch(
            id
        )  # pytype: disable=attribute-error
        if partial and self.hasnode(partial):
            if not maybewdir:
                return partial
            # single 'ff...' match in radix tree, ambiguous with wdir
            ambiguous = True
        elif maybewdir:
            # no 'ff...' match in radix tree, wdir identified
            raise error.WdirUnsupported
        else:
            return None
    except error.RevlogError:
        # parsers.c radix tree lookup gave multiple matches
        # fast path: for unfiltered changelog, radix tree is accurate
        if not getattr(self, 'filteredrevs', None):
            ambiguous = True
        # fall through to slow path that filters hidden revisions
    except (AttributeError, ValueError):
        # we are pure python, or key is not hex
        pass
    if ambiguous:
        raise error.AmbiguousPrefixLookupError(
            id, self.display_id, _(b'ambiguous identifier')
        )

    if id in self._pcache:
        return self._pcache[id]

    if len(id) > 40:
        return None

    # hex(node)[:...]
    evenlen = len(id) // 2 * 2  # grab an even number of digits
    try:
        # we're dropping the last digit, so let's check that it's hex,
        # to avoid the expensive computation below if it's not
        if len(id) % 2 > 0 and id[-1] not in hexdigits:
            return None
        prefix = bin(id[:evenlen])
    except binascii.Error:
        return None

    candidates = [e[7] for e in self.index if e[7].startswith(prefix)]
    matches = [
        n for n in candidates if hex(n).startswith(id) and self.hasnode(n)
    ]
    if self.nodeconstants.nullhex.startswith(id):
        matches.append(self.nullid)
    if matches:
        if len(matches) == 1 and not maybewdir:
            self._pcache[id] = matches[0]
            return matches[0]
        raise error.AmbiguousPrefixLookupError(
            id, self.display_id, _(b'ambiguous identifier')
        )
    if maybewdir:
        raise error.WdirUnsupported
    return None

2736

2737

def lookup(self, id):
    """locate a node based on:
    - revision number or str(revision number)
    - nodeid or subset of hex nodeid

    Raises ``error.LookupError`` when neither the exact nor the partial
    match yields a node.
    """
    exact = self._match(id)
    if exact is not None:
        return exact

    partial = self._partialmatch(id)
    if not partial:
        raise error.LookupError(id, self.display_id, _(b'no match found'))
    return partial

2750

2751

def shortest(self, node, minlength=1):
    """Find the shortest unambiguous prefix that matches node.

    The returned prefix is at least ``minlength`` hex digits long.
    ``error.LookupError`` is raised when ``node`` is not found.
    """
    hexnode = hex(node)

    def only_f(prefix):
        # a prefix made solely of 'f' could also designate the wdir id
        return all(c == b'f' for c in pycompat.iterbytestr(prefix))

    def resolves(prefix):
        try:
            found = self._partialmatch(prefix)
        except error.AmbiguousPrefixLookupError:
            return False
        except error.WdirUnsupported:
            # single 'ff...' match
            return True
        if found is None:
            raise error.LookupError(node, self.display_id, _(b'no node'))
        return True

    def skip_wdir_like(hexstr, start):
        """Disambiguate against wdirid."""
        for size in range(start, len(hexstr) + 1):
            candidate = hexstr[:size]
            if not only_f(candidate):
                return candidate
        return None

    if not getattr(self, 'filteredrevs', None):
        try:
            index_length = self.index.shortest(
                node
            )  # pytype: disable=attribute-error
            return skip_wdir_like(hexnode, max(index_length, minlength))
        except error.RevlogError:
            if node != self.nodeconstants.wdirid:
                raise error.LookupError(
                    node, self.display_id, _(b'no node')
                )
        except AttributeError:
            # Fall through to pure code
            pass

    if node == self.nodeconstants.wdirid:
        for size in range(minlength, len(hexnode) + 1):
            candidate = hexnode[:size]
            if resolves(candidate):
                return candidate

    for size in range(minlength, len(hexnode) + 1):
        if resolves(hexnode[:size]):
            return skip_wdir_like(hexnode, size)
    return None

2804

2805

def cmp(self, node, text):
    """compare text with a given file revision

    returns True if text is different than what is stored.
    """
    parent1, parent2 = self.parents(node)
    # hashing the text with the stored parents must give back the node
    expected = storageutil.hashrevisionsha1(text, parent1, parent2)
    return expected != node

2812

2813

def deltaparent(self, rev):
    """return deltaparent of the given revision"""
    base = self.index[rev][3]
    if base == rev:
        # the entry is its own base: there is no delta parent
        return nullrev
    if self.delta_config.general_delta:
        return base
    # without general delta the parent is the preceding revision
    return rev - 1

2822

2823

def issnapshot(self, rev):
    """tells whether rev is a snapshot"""
    inner = self._inner
    answer = inner.issnapshot(rev)
    # rebind on the instance so later calls reach the inner object directly
    self.issnapshot = inner.issnapshot
    return answer

2828

2829

def snapshotdepth(self, rev):
    """number of snapshot in the chain before this one

    Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
    """
    if not self.issnapshot(rev):
        # interpolate the revision: the message used to be raised with a
        # literal, unformatted ``%d`` in it
        raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
    chain = self._inner._deltachain(rev)[0]
    # the chain includes ``rev`` itself, which must not be counted
    return len(chain) - 1

2834

2835

def revdiff(self, rev1, rev2):
    """return or calculate a delta between two revisions

    The delta calculated is in binary form and is intended to be written to
    revlog data directly. So this function needs raw revision data.
    """
    stored_against_rev1 = rev1 != nullrev and self.deltaparent(rev2) == rev1
    if stored_against_rev1:
        # the chunk stored for rev2 is already a delta against rev1
        return bytes(self._inner._chunk(rev2))

    old_raw = self.rawdata(rev1)
    new_raw = self.rawdata(rev2)
    return mdiff.textdiff(old_raw, new_raw)

2845

2846

def revision(self, nodeorrev):
    """return an uncompressed revision of a given node or revision
    number.
    """
    text = self._revisiondata(nodeorrev)
    return text

2851

2852

def sidedata(self, nodeorrev):
    """a map of extra data related to the changeset but not part of the hash

    This function currently return a dictionary. However, more advanced
    mapping object will likely be used in the future for a more
    efficient/lazy code.
    """
    # accept either a revision number or a node
    rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
    return self._sidedata(rev)

2865

2866

def _rawtext(self, node, rev):

2866

def _rawtext(self, node, rev):

2867

"""return the possibly unvalidated rawtext for a revision

2867

"""return the possibly unvalidated rawtext for a revision

2868

2869

returns (rev, rawtext, validated)

2869

returns (rev, rawtext, validated)

2870

"""

2870

"""

2871

# Check if we have the entry in cache

2871

# Check if we have the entry in cache

2872

# The cache entry looks like (node, rev, rawtext)

2872

# The cache entry looks like (node, rev, rawtext)

2873

if self._inner._revisioncache:

2873

if self._inner._revisioncache:

2874

if self._inner._revisioncache[0] == node:

2874

if self._inner._revisioncache[0] == node:

2875

return (rev, self._inner._revisioncache[2], True)

2875

return (rev, self._inner._revisioncache[2], True)

2876

2877

if rev is None:

2877

if rev is None:

2878

rev = self.rev(node)

2878

rev = self.rev(node)

2879

2880

text = self._inner.raw_text(node, rev)

2880

text = self._inner.raw_text(node, rev)

2881

return (rev, text, False)

2881

return (rev, text, False)

2882

2883

def _revisiondata(self, nodeorrev, raw=False):

2883

def _revisiondata(self, nodeorrev, raw=False):

2884

# deal with <nodeorrev> argument type

2884

# deal with <nodeorrev> argument type

2885

if isinstance(nodeorrev, int):

2885

if isinstance(nodeorrev, int):

2886

rev = nodeorrev

2886

rev = nodeorrev

2887

node = self.node(rev)

2887

node = self.node(rev)

2888

else:

2888

else:

2889

node = nodeorrev

2889

node = nodeorrev

2890

rev = None

2890

rev = None

2891

2892

# fast path the special `nullid` rev

2892

# fast path the special `nullid` rev

2893

if node == self.nullid:

2893

if node == self.nullid:

2894

return b""

2894

return b""

2895

2896

# ``rawtext`` is the text as stored inside the revlog. Might be the

2896

# ``rawtext`` is the text as stored inside the revlog. Might be the

2897

# revision or might need to be processed to retrieve the revision.

2897

# revision or might need to be processed to retrieve the revision.

2898

rev, rawtext, validated = self._rawtext(node, rev)

2898

rev, rawtext, validated = self._rawtext(node, rev)

2899

2900

if raw and validated:

2900

if raw and validated:

2901

# if we don't want to process the raw text and that raw

2901

# if we don't want to process the raw text and that raw

2902

# text is cached, we can exit early.

2902

# text is cached, we can exit early.

2903

return rawtext

2903

return rawtext

2904

if rev is None:

2904

if rev is None:

2905

rev = self.rev(node)

2905

rev = self.rev(node)

2906

# the revlog's flag for this revision

2906

# the revlog's flag for this revision

2907

# (usually alter its state or content)

2907

# (usually alter its state or content)

2908

flags = self.flags(rev)

2908

flags = self.flags(rev)

2909

2910

if validated and flags == REVIDX_DEFAULT_FLAGS:

2910

if validated and flags == REVIDX_DEFAULT_FLAGS:

2911

# no extra flags set, no flag processor runs, text = rawtext

2911

# no extra flags set, no flag processor runs, text = rawtext

2912

return rawtext

2912

return rawtext

2913

2914

if raw:

2914

if raw:

2915

validatehash = flagutil.processflagsraw(self, rawtext, flags)

2915

validatehash = flagutil.processflagsraw(self, rawtext, flags)

2916

text = rawtext

2916

text = rawtext

2917

else:

2917

else:

2918

r = flagutil.processflagsread(self, rawtext, flags)

2918

r = flagutil.processflagsread(self, rawtext, flags)

2919

text, validatehash = r

2919

text, validatehash = r

2920

if validatehash:

2920

if validatehash:

2921

self.checkhash(text, node, rev=rev)

2921

self.checkhash(text, node, rev=rev)

2922

if not validated:

2922

if not validated:

2923

self._inner._revisioncache = (node, rev, rawtext)

2923

self._inner._revisioncache = (node, rev, rawtext)

2924

2925

return text

2925

return text

2926

2927

def _sidedata(self, rev):

2927

def _sidedata(self, rev):

2928

"""Return the sidedata for a given revision number."""

2928

"""Return the sidedata for a given revision number."""

2929

if self._sidedatafile is None:

2929

if self._sidedatafile is None:

2930

return {}

2930

return {}

2931

sidedata_end = None

2931

sidedata_end = None

2932

if self._docket is not None:

2932

if self._docket is not None:

2933

sidedata_end = self._docket.sidedata_end

2933

sidedata_end = self._docket.sidedata_end

2934

return self._inner.sidedata(rev, sidedata_end)

2934

return self._inner.sidedata(rev, sidedata_end)

2935

2936

def rawdata(self, nodeorrev):
    """Return the uncompressed raw data of a node or revision number.

    This is ``_revisiondata`` called with ``raw=True``.
    """
    raw_content = self._revisiondata(nodeorrev, raw=True)
    return raw_content

2939

2940

def hash(self, text, p1, p2):
    """Compute the node hash of ``text`` with parents ``p1`` and ``p2``.

    The work is done by ``storageutil.hashrevisionsha1``. This exists as a
    method so that subclasses can replace the hash as needed.
    """
    digest = storageutil.hashrevisionsha1(text, p1, p2)
    return digest

2947

2948

def checkhash(self, text, node, p1=None, p2=None, rev=None):
    """Verify that ``node`` is the hash of ``text`` and its parents.

    When both ``p1`` and ``p2`` are None they are looked up with
    ``self.parents(node)``. ``rev`` is only used to build the error message.

    Raises ``error.RevlogError`` on a mismatch, or
    ``error.CensoredNodeError`` instead when the revlog is censorable and
    ``text`` is a censored text.

    This exists as a method so that subclasses can extend hash mismatch
    behaviors as needed.
    """
    try:
        if p1 is None and p2 is None:
            p1, p2 = self.parents(node)
        if node == self.hash(text, p1, p2):
            return

        # Clear the revision cache on hash failure. The cache only stores
        # the raw revision, so dropping it merely costs a cache miss the
        # next time the raw revision data is accessed. This case should be
        # rare, and teaching the cache about the hash verification state
        # would be extra work.
        cached = self._inner._revisioncache
        if cached and cached[0] == node:
            self._inner._revisioncache = None

        if rev is None:
            label = templatefilters.short(hex(node))
        else:
            label = rev
        raise error.RevlogError(
            _(b"integrity check failed on %s:%s")
            % (self.display_id, pycompat.bytestr(label))
        )
    except error.RevlogError:
        censored = (
            self.feature_config.censorable
            and storageutil.iscensoredtext(text)
        )
        if censored:
            raise error.CensoredNodeError(self.display_id, node, text)
        raise

2983

2984

@property

2984

@property

2985

def _split_index_file(self):

2985

def _split_index_file(self):

2986

"""the path where to expect the index of an ongoing splitting operation

2986

"""the path where to expect the index of an ongoing splitting operation

2987

2988

The file will only exist if a splitting operation is in progress, but

2988

The file will only exist if a splitting operation is in progress, but

2989

it is always expected at the same location."""

2989

it is always expected at the same location."""

2990

parts = self.radix.split(b'/')

2990

parts = self.radix.split(b'/')

2991

if len(parts) > 1:

2991

if len(parts) > 1:

2992

# adds a '-s' prefix to the ``data/` or `meta/` base

2992

# adds a '-s' prefix to the ``data/` or `meta/` base

2993

head = parts[0] + b'-s'

2993

head = parts[0] + b'-s'

2994

mids = parts[1:-1]

2994

mids = parts[1:-1]

2995

tail = parts[-1] + b'.i'

2995

tail = parts[-1] + b'.i'

2996

pieces = [head] + mids + [tail]

2996

pieces = [head] + mids + [tail]

2997

return b'/'.join(pieces)

2997

return b'/'.join(pieces)

2998

else:

2998

else:

2999

# the revlog is stored at the root of the store (changelog or

2999

# the revlog is stored at the root of the store (changelog or

3000

# manifest), no risk of collision.

3000

# manifest), no risk of collision.

3001

return self.radix + b'.i.s'

3001

return self.radix + b'.i.s'

3002

3003

def _enforceinlinesize(self, tr):

3003

def _enforceinlinesize(self, tr):

3004

"""Check if the revlog is too big for inline and convert if so.

3004

"""Check if the revlog is too big for inline and convert if so.

3005

3006

This should be called after revisions are added to the revlog. If the

3006

This should be called after revisions are added to the revlog. If the

3007

revlog has grown too large to be an inline revlog, it will convert it

3007

revlog has grown too large to be an inline revlog, it will convert it

3008

to use multiple index and data files.

3008

to use multiple index and data files.

3009

"""

3009

"""

3010

tiprev = len(self) - 1

3010

tiprev = len(self) - 1

3011

total_size = self.start(tiprev) + self.length(tiprev)

3011

total_size = self.start(tiprev) + self.length(tiprev)

3012

if not self._inline or (self._may_inline and total_size < _maxinline):

3012

if not self._inline or (self._may_inline and total_size < _maxinline):

3013

return

3013

return

3014

3015

if self._docket is not None:

3015

if self._docket is not None:

3016

msg = b"inline revlog should not have a docket"

3016

msg = b"inline revlog should not have a docket"

3017

raise error.ProgrammingError(msg)

3017

raise error.ProgrammingError(msg)

3018

3019

# In the common case, we enforce inline size because the revlog has

3019

# In the common case, we enforce inline size because the revlog has

3020

# been appened too. And in such case, it must have an initial offset

3020

# been appened too. And in such case, it must have an initial offset

3021

# recorded in the transaction.

3021

# recorded in the transaction.

3022

troffset = tr.findoffset(self._inner.canonical_index_file)

3022

troffset = tr.findoffset(self._inner.canonical_index_file)

3023

pre_touched = troffset is not None

3023

pre_touched = troffset is not None

3024

if not pre_touched and self.target[0] != KIND_CHANGELOG:

3024

if not pre_touched and self.target[0] != KIND_CHANGELOG:

3025

raise error.RevlogError(

3025

raise error.RevlogError(

3026

_(b"%s not found in the transaction") % self._indexfile

3026

_(b"%s not found in the transaction") % self._indexfile

3027

)

3027

)

3028

3029

tr.addbackup(self._inner.canonical_index_file, for_offset=pre_touched)

3029

tr.addbackup(self._inner.canonical_index_file, for_offset=pre_touched)

3030

tr.add(self._datafile, 0)

3030

tr.add(self._datafile, 0)

3031

3032

new_index_file_path = None

3032

new_index_file_path = None

3033

old_index_file_path = self._indexfile

3033

old_index_file_path = self._indexfile

3034

new_index_file_path = self._split_index_file

3034

new_index_file_path = self._split_index_file

3035

opener = self.opener

3035

opener = self.opener

3036

weak_self = weakref.ref(self)

3036

weak_self = weakref.ref(self)

3037

3038

# the "split" index replace the real index when the transaction is

3038

# the "split" index replace the real index when the transaction is

3039

# finalized

3039

# finalized

3040

def finalize_callback(tr):

3040

def finalize_callback(tr):

3041

opener.rename(

3041

opener.rename(

3042

new_index_file_path,

3042

new_index_file_path,

3043

old_index_file_path,

3043

old_index_file_path,

3044

checkambig=True,

3044

checkambig=True,

3045

)

3045

)

3046

maybe_self = weak_self()

3046

maybe_self = weak_self()

3047

if maybe_self is not None:

3047

if maybe_self is not None:

3048

maybe_self._indexfile = old_index_file_path

3048

maybe_self._indexfile = old_index_file_path

3049

maybe_self._inner.index_file = maybe_self._indexfile

3049

maybe_self._inner.index_file = maybe_self._indexfile

3050

3051

def abort_callback(tr):

3051

def abort_callback(tr):

3052

maybe_self = weak_self()

3052

maybe_self = weak_self()

3053

if maybe_self is not None:

3053

if maybe_self is not None:

3054

maybe_self._indexfile = old_index_file_path

3054

maybe_self._indexfile = old_index_file_path

3055

maybe_self._inner.inline = True

3055

maybe_self._inner.inline = True

3056

maybe_self._inner.index_file = old_index_file_path

3056

maybe_self._inner.index_file = old_index_file_path

3057

3058

tr.registertmp(new_index_file_path)

3058

tr.registertmp(new_index_file_path)

3059

# we use 001 here to make this this happens after the finalisation of

3059

# we use 001 here to make this this happens after the finalisation of

3060

# pending changelog write (using 000). Otherwise the two finalizer

3060

# pending changelog write (using 000). Otherwise the two finalizer

3061

# would step over each other and delete the changelog.i file.

3061

# would step over each other and delete the changelog.i file.

3062

if self.target[1] is not None:

3062

if self.target[1] is not None:

3063

callback_id = b'001-revlog-split-%d-%s' % self.target

3063

callback_id = b'001-revlog-split-%d-%s' % self.target

3064

else:

3064

else:

3065

callback_id = b'001-revlog-split-%d' % self.target[0]

3065

callback_id = b'001-revlog-split-%d' % self.target[0]

3066

tr.addfinalize(callback_id, finalize_callback)

3066

tr.addfinalize(callback_id, finalize_callback)

3067

tr.addabort(callback_id, abort_callback)

3067

tr.addabort(callback_id, abort_callback)

3068

3069

self._format_flags &= ~FLAG_INLINE_DATA

3069

self._format_flags &= ~FLAG_INLINE_DATA

3070

self._inner.split_inline(

3070

self._inner.split_inline(

3071

tr,

3071

tr,

3072

self._format_flags | self._format_version,

3072

self._format_flags | self._format_version,

3073

new_index_file_path=new_index_file_path,

3073

new_index_file_path=new_index_file_path,

3074

)

3074

)

3075

3076

self._inline = False

3076

self._inline = False

3077

if new_index_file_path is not None:

3077

if new_index_file_path is not None:

3078

self._indexfile = new_index_file_path

3078

self._indexfile = new_index_file_path

3079

3080

nodemaputil.setup_persistent_nodemap(tr, self)

3080

nodemaputil.setup_persistent_nodemap(tr, self)

3081

3082

def _nodeduplicatecallback(self, transaction, node):

3082

def _nodeduplicatecallback(self, transaction, node):

3083

"""called when trying to add a node already stored."""

3083

"""called when trying to add a node already stored."""

3084

3085

@contextlib.contextmanager
def reading(self):
    """Context manager wrapping ``self._inner.reading()``.

    The inner context is entered before the body runs and left afterwards.
    """
    inner_context = self._inner.reading()
    with inner_context:
        yield

3089

3090

@contextlib.contextmanager

3090

@contextlib.contextmanager

3091

def _writing(self, transaction):

3091

def _writing(self, transaction):

3092

if self._trypending:

3092

if self._trypending:

3093

msg = b'try to write in a `trypending` revlog: %s'

3093

msg = b'try to write in a `trypending` revlog: %s'

3094

msg %= self.display_id

3094

msg %= self.display_id

3095

raise error.ProgrammingError(msg)

3095

raise error.ProgrammingError(msg)

3096

if self._inner.is_writing:

3096

if self._inner.is_writing:

3097

yield

3097

yield

3098

else:

3098

else:

3099

data_end = None

3099

data_end = None

3100

sidedata_end = None

3100

sidedata_end = None

3101

if self._docket is not None:

3101

if self._docket is not None:

3102

data_end = self._docket.data_end

3102

data_end = self._docket.data_end

3103

sidedata_end = self._docket.sidedata_end

3103

sidedata_end = self._docket.sidedata_end

3104

with self._inner.writing(

3104

with self._inner.writing(

3105

transaction,

3105

transaction,

3106

data_end=data_end,

3106

data_end=data_end,

3107

sidedata_end=sidedata_end,

3107

sidedata_end=sidedata_end,

3108

):

3108

):

3109

yield

3109

yield

3110

if self._docket is not None:

3110

if self._docket is not None:

3111

self._write_docket(transaction)

3111

self._write_docket(transaction)

3112

3113

@property
def is_delaying(self):
    """The ``is_delaying`` value reported by the inner revlog object."""
    inner = self._inner
    return inner.is_delaying

3116

3117

def _write_docket(self, transaction):

3117

def _write_docket(self, transaction):

3118

"""write the current docket on disk

3118

"""write the current docket on disk

3119

3120

Exist as a method to help changelog to implement transaction logic

3120

Exist as a method to help changelog to implement transaction logic

3121

3122

We could also imagine using the same transaction logic for all revlog

3122

We could also imagine using the same transaction logic for all revlog

3123

since docket are cheap."""

3123

since docket are cheap."""

3124

self._docket.write(transaction)

3124

self._docket.write(transaction)

3125

3126

def addrevision(
    self,
    text,
    transaction,
    link,
    p1,
    p2,
    cachedelta=None,
    node=None,
    flags=REVIDX_DEFAULT_FLAGS,
    deltacomputer=None,
    sidedata=None,
):
    """add a revision to the log

    text - the revision data to add
    transaction - the transaction object used for rollback
    link - the linkrev data to add
    p1, p2 - the parent nodeids of the revision
    cachedelta - an optional precomputed delta; it is ignored when the
        write flag processing changes the revision data
    node - nodeid of revision; typically node is not specified, and it is
        computed by default as hash(text, p1, p2), however subclasses might
        use different hashing method (and override checkhash() in such case)
    flags - the known flags to set on the revision
    deltacomputer - an optional deltacomputer instance shared between
        multiple calls
    sidedata - an optional mapping of sidedata; None is treated as empty

    If the node is already present in the index, its revision number is
    returned and nothing is added. Otherwise the result of
    ``addrawrevision`` is returned.

    Raises ``error.RevlogError`` for a ``nullrev`` linkrev or a raw text
    longer than ``_maxentrysize``, and ``error.ProgrammingError`` when
    non-empty sidedata is given to a revlog without sidedata support.
    """
    if link == nullrev:
        msg = _(b"attempted to add linkrev -1 to %s") % self.display_id
        raise error.RevlogError(msg)

    if sidedata is None:
        sidedata = {}
    elif sidedata and not self.feature_config.has_side_data:
        msg = _(b"trying to add sidedata to a revlog who don't support them")
        raise error.ProgrammingError(msg)

    if flags:
        node = node or self.hash(text, p1, p2)

    rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

    # If the flag processor modifies the revision data, any provided
    # cachedelta no longer applies.
    if rawtext != text:
        cachedelta = None

    raw_size = len(rawtext)
    if raw_size > _maxentrysize:
        msg = _(b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB")
        raise error.RevlogError(msg % (self.display_id, len(rawtext)))

    node = node or self.hash(rawtext, p1, p2)
    known_rev = self.index.get_rev(node)
    if known_rev is not None:
        return known_rev

    if validatehash:
        self.checkhash(rawtext, node, p1=p1, p2=p2)

    return self.addrawrevision(
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=cachedelta,
        deltacomputer=deltacomputer,
        sidedata=sidedata,
    )

3203

3204

def addrawrevision(
    self,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    node,
    flags,
    cachedelta=None,
    deltacomputer=None,
    sidedata=None,
):
    """add a raw revision with known flags, node and parents

    Useful when reusing a revision not stored in this revlog (ex: received
    over wire, or read from an external bundle).

    The revision is added through ``_addrevision`` inside a
    ``self._writing(transaction)`` context, and the value ``_addrevision``
    returns is returned unchanged.
    """
    optional = {
        'deltacomputer': deltacomputer,
        'sidedata': sidedata,
    }
    with self._writing(transaction):
        added = self._addrevision(
            node,
            rawtext,
            transaction,
            link,
            p1,
            p2,
            flags,
            cachedelta,
            **optional,
        )
        return added

3234

3235

def compress(self, data: bytes) -> Tuple[bytes, bytes]:
    """Compress ``data`` by delegating to ``self._inner.compress``.

    The pair of byte strings produced by the inner object is returned
    unchanged.
    """
    compressed = self._inner.compress(data)
    return compressed

3237

3238

def decompress(self, data):
    """Decompress ``data`` by delegating to ``self._inner.decompress``."""
    restored = self._inner.decompress(data)
    return restored

3240

3241

def _addrevision(

3241

def _addrevision(

3242

self,

3242

self,

3243

node,

3243

node,

3244

rawtext,

3244

rawtext,

3245

transaction,

3245

transaction,

3246

link,

3246

link,

3247

p1,

3247

p1,

3248

p2,

3248

p2,

3249

flags,

3249

flags,

3250

cachedelta,

3250

cachedelta,

3251

alwayscache=False,

3251

alwayscache=False,

3252

deltacomputer=None,

3252

deltacomputer=None,

3253

sidedata=None,

3253

sidedata=None,

3254

):

3254

):

3255

"""internal function to add revisions to the log

3255

"""internal function to add revisions to the log

3256

3257

see addrevision for argument descriptions.

3257

see addrevision for argument descriptions.

3258

3259

note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

3259

note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

3260

3261

if "deltacomputer" is not provided or None, a defaultdeltacomputer will

3261

if "deltacomputer" is not provided or None, a defaultdeltacomputer will

3262

be used.

3262

be used.

3263

3264

invariants:

3264

invariants:

3265

- rawtext is optional (can be None); if not set, cachedelta must be set.

3265

- rawtext is optional (can be None); if not set, cachedelta must be set.

3266

if both are set, they must correspond to each other.

3266

if both are set, they must correspond to each other.

3267

"""

3267

"""

3268

if node == self.nullid:

3268

if node == self.nullid:

3269

raise error.RevlogError(

3269

raise error.RevlogError(

3270

_(b"%s: attempt to add null revision") % self.display_id

3270

_(b"%s: attempt to add null revision") % self.display_id

3271

)

3271

)

3272

if (

3272

if (

3273

node == self.nodeconstants.wdirid

3273

node == self.nodeconstants.wdirid

3274

or node in self.nodeconstants.wdirfilenodeids

3274

or node in self.nodeconstants.wdirfilenodeids

3275

):

3275

):

3276

raise error.RevlogError(

3276

raise error.RevlogError(

3277

_(b"%s: attempt to add wdir revision") % self.display_id

3277

_(b"%s: attempt to add wdir revision") % self.display_id

3278

)

3278

)

3279

if not self._inner.is_writing:

3279

if not self._inner.is_writing:

3280

msg = b'adding revision outside `revlog._writing` context'

3280

msg = b'adding revision outside `revlog._writing` context'

3281

raise error.ProgrammingError(msg)

3281

raise error.ProgrammingError(msg)

3282

3283

btext = [rawtext]

3283

btext = [rawtext]

3284

3285

curr = len(self)

3285

curr = len(self)

3286

prev = curr - 1

3286

prev = curr - 1

3287

3288

offset = self._get_data_offset(prev)

3288

offset = self._get_data_offset(prev)

3289

3290

if self._concurrencychecker:

3290

if self._concurrencychecker:

3291

ifh, dfh, sdfh = self._inner._writinghandles

3291

ifh, dfh, sdfh = self._inner._writinghandles

3292

# XXX no checking for the sidedata file

3292

# XXX no checking for the sidedata file

3293

if self._inline:

3293

if self._inline:

3294

# offset is "as if" it were in the .d file, so we need to add on

3294

# offset is "as if" it were in the .d file, so we need to add on

3295

# the size of the entry metadata.

3295

# the size of the entry metadata.

3296

self._concurrencychecker(

3296

self._concurrencychecker(

3297

ifh, self._indexfile, offset + curr * self.index.entry_size

3297

ifh, self._indexfile, offset + curr * self.index.entry_size

3298

)

3298

)

3299

else:

3299

else:

3300

# Entries in the .i are a consistent size.

3300

# Entries in the .i are a consistent size.

3301

self._concurrencychecker(

3301

self._concurrencychecker(

3302

ifh, self._indexfile, curr * self.index.entry_size

3302

ifh, self._indexfile, curr * self.index.entry_size

3303

)

3303

)

3304

self._concurrencychecker(dfh, self._datafile, offset)

3304

self._concurrencychecker(dfh, self._datafile, offset)

3305

3306

p1r, p2r = self.rev(p1), self.rev(p2)

3306

p1r, p2r = self.rev(p1), self.rev(p2)

3307

3308

# full versions are inserted when the needed deltas

3308

# full versions are inserted when the needed deltas

3309

# become comparable to the uncompressed text

3309

# become comparable to the uncompressed text

3310

if rawtext is None:

3310

if rawtext is None:

3311

# need rawtext size, before changed by flag processors, which is

3311

# need rawtext size, before changed by flag processors, which is

3312

# the non-raw size. use revlog explicitly to avoid filelog's extra

3312

# the non-raw size. use revlog explicitly to avoid filelog's extra

3313

# logic that might remove metadata size.

3313

# logic that might remove metadata size.

3314

textlen = mdiff.patchedsize(

3314

textlen = mdiff.patchedsize(

3315

revlog.size(self, cachedelta[0]), cachedelta[1]

3315

revlog.size(self, cachedelta[0]), cachedelta[1]

3316

)

3316

)

3317

else:

3317

else:

3318

textlen = len(rawtext)

3318

textlen = len(rawtext)

3319

3320

if deltacomputer is None:

3320

if deltacomputer is None:

3321

write_debug = None

3321

write_debug = None

3322

if self.delta_config.debug_delta:

3322

if self.delta_config.debug_delta:

3323

write_debug = transaction._report

3323

write_debug = transaction._report

3324

deltacomputer = deltautil.deltacomputer(

3324

deltacomputer = deltautil.deltacomputer(

3325

self, write_debug=write_debug

3325

self, write_debug=write_debug

3326

)

3326

)

3327

3328

if cachedelta is not None and len(cachedelta) == 2:

3328

if cachedelta is not None and len(cachedelta) == 2:

3329

# If the cached delta has no information about how it should be

3329

# If the cached delta has no information about how it should be

3330

# reused, add the default reuse instruction according to the

3330

# reused, add the default reuse instruction according to the

3331

# revlog's configuration.

3331

# revlog's configuration.

3332

if (

3332

if (

3333

self.delta_config.general_delta

3333

self.delta_config.general_delta

3334

and self.delta_config.lazy_delta_base

3334

and self.delta_config.lazy_delta_base

3335

):

3335

):

3336

delta_base_reuse = DELTA_BASE_REUSE_TRY

3336

delta_base_reuse = DELTA_BASE_REUSE_TRY

3337

else:

3337

else:

3338

delta_base_reuse = DELTA_BASE_REUSE_NO

3338

delta_base_reuse = DELTA_BASE_REUSE_NO

3339

cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)

3339

cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)

3340

3341

revinfo = revlogutils.revisioninfo(

3341

revinfo = revlogutils.revisioninfo(

3342

node,

3342

node,

3343

p1,

3343

p1,

3344

p2,

3344

p2,

3345

btext,

3345

btext,

3346

textlen,

3346

textlen,

3347

cachedelta,

3347

cachedelta,

3348

flags,

3348

flags,

3349

)

3349

)

3350

3351

deltainfo = deltacomputer.finddeltainfo(revinfo)

3351

deltainfo = deltacomputer.finddeltainfo(revinfo)

3352

3353

compression_mode = COMP_MODE_INLINE

3353

compression_mode = COMP_MODE_INLINE

3354

if self._docket is not None:

3354

if self._docket is not None:

3355

default_comp = self._docket.default_compression_header

3355

default_comp = self._docket.default_compression_header

3356

r = deltautil.delta_compression(default_comp, deltainfo)

3356

r = deltautil.delta_compression(default_comp, deltainfo)

3357

compression_mode, deltainfo = r

3357

compression_mode, deltainfo = r

3358

3359

sidedata_compression_mode = COMP_MODE_INLINE

3359

sidedata_compression_mode = COMP_MODE_INLINE

3360

if sidedata and self.feature_config.has_side_data:

3360

if sidedata and self.feature_config.has_side_data:

3361

sidedata_compression_mode = COMP_MODE_PLAIN

3361

sidedata_compression_mode = COMP_MODE_PLAIN

3362

serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)

3362

serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)

3363

sidedata_offset = self._docket.sidedata_end

3363

sidedata_offset = self._docket.sidedata_end

3364

h, comp_sidedata = self._inner.compress(serialized_sidedata)

3364

h, comp_sidedata = self._inner.compress(serialized_sidedata)

3365

if (

3365

if (

3366

h != b'u'

3366

h != b'u'

3367

and comp_sidedata[0:1] != b'\0'

3367

and comp_sidedata[0:1] != b'\0'

3368

and len(comp_sidedata) < len(serialized_sidedata)

3368

and len(comp_sidedata) < len(serialized_sidedata)

3369

):

3369

):

3370

assert not h

3370

assert not h

3371

if (

3371

if (

3372

comp_sidedata[0:1]

3372

comp_sidedata[0:1]

3373

== self._docket.default_compression_header

3373

== self._docket.default_compression_header

3374

):

3374

):

3375

sidedata_compression_mode = COMP_MODE_DEFAULT

3375

sidedata_compression_mode = COMP_MODE_DEFAULT

3376

serialized_sidedata = comp_sidedata

3376

serialized_sidedata = comp_sidedata

3377

else:

3377

else:

3378

sidedata_compression_mode = COMP_MODE_INLINE

3378

sidedata_compression_mode = COMP_MODE_INLINE

3379

serialized_sidedata = comp_sidedata

3379

serialized_sidedata = comp_sidedata

3380

else:

3380

else:

3381

serialized_sidedata = b""

3381

serialized_sidedata = b""

3382

# Don't store the offset if the sidedata is empty, that way

3382

# Don't store the offset if the sidedata is empty, that way

3383

# we can easily detect empty sidedata and they will be no different

3383

# we can easily detect empty sidedata and they will be no different

3384

# than ones we manually add.

3384

# than ones we manually add.

3385

sidedata_offset = 0

3385

sidedata_offset = 0

3386

3387

rank = RANK_UNKNOWN

3387

rank = RANK_UNKNOWN

3388

if self.feature_config.compute_rank:

3388

if self.feature_config.compute_rank:

3389

if (p1r, p2r) == (nullrev, nullrev):

3389

if (p1r, p2r) == (nullrev, nullrev):

3390

rank = 1

3390

rank = 1

3391

elif p1r != nullrev and p2r == nullrev:

3391

elif p1r != nullrev and p2r == nullrev:

3392

rank = 1 + self.fast_rank(p1r)

3392

rank = 1 + self.fast_rank(p1r)

3393

elif p1r == nullrev and p2r != nullrev:

3393

elif p1r == nullrev and p2r != nullrev:

3394

rank = 1 + self.fast_rank(p2r)

3394

rank = 1 + self.fast_rank(p2r)

3395

else: # merge node

3395

else: # merge node

3396

if rustdagop is not None and self.index.rust_ext_compat:

3396

if rustdagop is not None and self.index.rust_ext_compat:

3397

rank = rustdagop.rank(self.index, p1r, p2r)

3397

rank = rustdagop.rank(self.index, p1r, p2r)

3398

else:

3398

else:

3399

pmin, pmax = sorted((p1r, p2r))

3399

pmin, pmax = sorted((p1r, p2r))

3400

rank = 1 + self.fast_rank(pmax)

3400

rank = 1 + self.fast_rank(pmax)

3401

rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))

3401

rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))

3402

3403

e = revlogutils.entry(

3403

e = revlogutils.entry(

3404

flags=flags,

3404

flags=flags,

3405

data_offset=offset,

3405

data_offset=offset,

3406

data_compressed_length=deltainfo.deltalen,

3406

data_compressed_length=deltainfo.deltalen,

3407

data_uncompressed_length=textlen,

3407

data_uncompressed_length=textlen,

3408

data_compression_mode=compression_mode,

3408

data_compression_mode=compression_mode,

3409

data_delta_base=deltainfo.base,

3409

data_delta_base=deltainfo.base,

3410

link_rev=link,

3410

link_rev=link,

3411

parent_rev_1=p1r,

3411

parent_rev_1=p1r,

3412

parent_rev_2=p2r,

3412

parent_rev_2=p2r,

3413

node_id=node,

3413

node_id=node,

3414

sidedata_offset=sidedata_offset,

3414

sidedata_offset=sidedata_offset,

3415

sidedata_compressed_length=len(serialized_sidedata),

3415

sidedata_compressed_length=len(serialized_sidedata),

3416

sidedata_compression_mode=sidedata_compression_mode,

3416

sidedata_compression_mode=sidedata_compression_mode,

3417

rank=rank,

3417

rank=rank,

3418

)

3418

)

3419

3420

self.index.append(e)

3420

self.index.append(e)

3421

entry = self.index.entry_binary(curr)

3421

entry = self.index.entry_binary(curr)

3422

if curr == 0 and self._docket is None:

3422

if curr == 0 and self._docket is None:

3423

header = self._format_flags | self._format_version

3423

header = self._format_flags | self._format_version

3424

header = self.index.pack_header(header)

3424

header = self.index.pack_header(header)

3425

entry = header + entry

3425

entry = header + entry

3426

self._writeentry(

3426

self._writeentry(

3427

transaction,

3427

transaction,

3428

entry,

3428

entry,

3429

deltainfo.data,

3429

deltainfo.data,

3430

link,

3430

link,

3431

offset,

3431

offset,

3432

serialized_sidedata,

3432

serialized_sidedata,

3433

sidedata_offset,

3433

sidedata_offset,

3434

)

3434

)

3435

3436

rawtext = btext[0]

3436

rawtext = btext[0]

3437

3438

if alwayscache and rawtext is None:

3438

if alwayscache and rawtext is None:

3439

rawtext = deltacomputer.buildtext(revinfo)

3439

rawtext = deltacomputer.buildtext(revinfo)

3440

3441

if type(rawtext) == bytes: # only accept immutable objects

3441

if type(rawtext) == bytes: # only accept immutable objects

3442

self._inner._revisioncache = (node, curr, rawtext)

3442

self._inner._revisioncache = (node, curr, rawtext)

3443

self._chainbasecache[curr] = deltainfo.chainbase

3443

self._chainbasecache[curr] = deltainfo.chainbase

3444

return curr

3444

return curr

3445

3446

def _get_data_offset(self, prev):
    """Return the offset at which the next revision's data will be written.

    Without a docket this is simply ``self.end(prev)``, an O(1) lookup.
    When a docket is present, its recorded ``data_end`` is used instead:
    sidedata can be rewritten to the end of the data file within a
    transaction, so rev ``n - 1``'s sidedata may end up written after rev
    ``n``'s data and the end of ``prev`` is no longer the end of the file.

    TODO cache this in a docket file before getting out of experimental.
    """
    docket = self._docket
    if docket is not None:
        return docket.data_end
    return self.end(prev)

3459

3460

def _writeentry(
    self,
    transaction,
    entry,
    data,
    link,
    offset,
    sidedata,
    sidedata_offset,
):
    """Write one revision (index entry, data and sidedata) to storage.

    The actual writing is delegated to ``self._inner.write_entry``. When a
    docket is in use, its recorded end offsets are handed to that call and
    refreshed afterwards from the offsets it returns.
    """
    # Background on why explicit end offsets matter: handles opened in
    # "a+" mode behave inconsistently across platforms. Windows needs a
    # positioning call whenever a handle switches between reading and
    # writing (see 3686fa2b8eee and the mixedfilemodewrapper in
    # windows.py), and some Solaris versions were seen not to append at
    # the end of the file after a seek to an earlier position (see
    # issue4943).
    #
    # The workaround is a seek() before each write. This is probably
    # unnecessary on Python 3, but the handle is shared with readers that
    # may have moved it, so change this with care.
    docket = self._docket
    if docket is None:
        index_end = data_end = sidedata_end = None
    else:
        index_end = docket.index_end
        data_end = docket.data_end
        sidedata_end = docket.sidedata_end

    new_ends = self._inner.write_entry(
        transaction,
        entry,
        data,
        link,
        offset,
        sidedata,
        sidedata_offset,
        index_end,
        data_end,
        sidedata_end,
    )
    self._enforceinlinesize(transaction)
    if self._docket is not None:
        # new_ends is indexed as (index, data, sidedata)
        self._docket.index_end = new_ends[0]
        self._docket.data_end = new_ends[1]
        self._docket.sidedata_end = new_ends[2]

    nodemaputil.setup_persistent_nodemap(transaction, self)

3507

3508

def addgroup(
    self,
    deltas,
    linkmapper,
    transaction,
    alwayscache=False,
    addrevisioncb=None,
    duplicaterevisioncb=None,
    debug_info=None,
    delta_base_reuse_policy=None,
):
    """
    Add a group of deltas to the revision log.

    Each item of ``deltas`` is an 8-tuple ``(node, p1, p2, linknode,
    deltabase, delta, flags, sidedata)``. The first delta is against its
    parent, which should already be in our log; the rest are against the
    previous delta.

    If ``addrevisioncb`` is defined, it is called with this revlog and the
    revision that was just added. If ``duplicaterevisioncb`` is defined,
    it is called the same way for revisions that were already stored.

    Returns True if at least one item of ``deltas`` was processed (newly
    added or already present), False if ``deltas`` was empty.
    """

    if self._adding_group:
        raise error.ProgrammingError(b'cannot nest addgroup() calls')

    # Fall back to the delta-base reuse policy implied by the revlog
    # configuration when the caller did not pick one.
    if delta_base_reuse_policy is None:
        delta_cfg = self.delta_config
        lazy_reuse = delta_cfg.general_delta and delta_cfg.lazy_delta_base
        delta_base_reuse_policy = (
            DELTA_BASE_REUSE_TRY if lazy_reuse else DELTA_BASE_REUSE_NO
        )

    self._adding_group = True
    added_any = False
    try:
        with self._writing(transaction):
            write_debug = (
                transaction._report
                if self.delta_config.debug_delta
                else None
            )
            deltacomputer = deltautil.deltacomputer(
                self,
                write_debug=write_debug,
                debug_info=debug_info,
            )
            for (
                node,
                p1,
                p2,
                linknode,
                deltabase,
                delta,
                flags,
                sidedata,
            ) in deltas:
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                known_rev = self.index.get_rev(node)
                if known_rev is not None:
                    # Already stored: this happens when two branches make
                    # the same change.
                    self._nodeduplicatecallback(transaction, known_rev)
                    if duplicaterevisioncb:
                        duplicaterevisioncb(self, known_rev)
                    added_any = True
                    continue

                for parent in (p1, p2):
                    if not self.index.has_node(parent):
                        raise error.LookupError(
                            parent, self.radix, _(b'unknown parent')
                        )

                if not self.index.has_node(deltabase):
                    raise error.LookupError(
                        deltabase, self.display_id, _(b'unknown delta base')
                    )

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # A delta against a censored base must be a full
                    # replacement expressed as a single patch operation.
                    hlen = struct.calcsize(b">lll")
                    oldlen = self.rawsize(baserev)
                    newlen = len(delta) - hlen
                    header = delta[:hlen]
                    if header != mdiff.replacediffheader(oldlen, newlen):
                        raise error.CensoredBaseError(
                            self.display_id, self.node(baserev)
                        )

                if not flags and self._peek_iscensored(baserev, delta):
                    flags |= REVIDX_ISCENSORED

                # Consumers of addrevisioncb are expected to fetch the
                # revision they were told about through revision(), which
                # takes a fast path on a cache hit; ``alwayscache`` is
                # forwarded to _addrevision() for that purpose.
                # addgroup() is only used for changegroup handling, so the
                # revision data can always be treated as raw by the
                # flagprocessor (hence the ``None`` text argument).
                new_rev = self._addrevision(
                    node,
                    None,
                    transaction,
                    link,
                    p1,
                    p2,
                    flags,
                    (baserev, delta, delta_base_reuse_policy),
                    alwayscache=alwayscache,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

                if addrevisioncb:
                    addrevisioncb(self, new_rev)
                added_any = True
    finally:
        self._adding_group = False
    return added_any

3636

3637

def iscensored(self, rev):
    """Tell whether revision ``rev`` is flagged as censored.

    Always False when the revlog's feature configuration marks it as not
    censorable; otherwise the result of masking the revision's flags with
    ``REVIDX_ISCENSORED`` (truthy when the flag is set).
    """
    if self.feature_config.censorable:
        return self.flags(rev) & REVIDX_ISCENSORED
    return False

3643

3644

def _peek_iscensored(self, baserev, delta):
    """Cheaply check whether applying ``delta`` yields a censored revision.

    Always False when the revlog's feature configuration marks it as not
    censorable; otherwise the decision is delegated to
    ``storageutil.deltaiscensored``.
    """
    if self.feature_config.censorable:
        return storageutil.deltaiscensored(delta, baserev, self.rawsize)
    return False

3650

3651

def getstrippoint(self, minlink):
    """Find the minimum rev that must be stripped to strip the linkrev.

    Returns a tuple containing the minimum rev and a set of all revs that
    have linkrevs that will be broken by this strip. The computation is
    delegated to ``storageutil.resolvestripinfo``.
    """
    tiprev = len(self) - 1
    heads = self.headrevs()
    return storageutil.resolvestripinfo(
        minlink,
        tiprev,
        heads,
        self.linkrev,
        self.parentrevs,
    )

3664

3665

def strip(self, minlink, transaction):
    """Truncate the revlog at the first revision with a linkrev >= minlink.

    Called when revision ``minlink`` and its descendants are being
    stripped from the repository. Every revision whose linkrev is
    >= minlink has to go, because the matching changelog revisions will
    be renumbered after the strip.

    The revlog is therefore cut at the first such revision; the caller is
    trusted to have saved any revision that should survive and to re-add
    it after the truncation.
    """
    if not len(self):
        return

    rev, _brokenrevs = self.getstrippoint(minlink)
    if rev == len(self):
        # nothing at or above the strip point
        return

    # Step 1: register the truncation of the on-disk files.
    entry_size_total = rev * self.index.entry_size
    data_end = self.start(rev)
    if self._inline:
        # inline revlogs keep the data in the index file as well
        end = data_end + entry_size_total
    else:
        transaction.add(self._datafile, data_end)
        end = entry_size_total

    if self._sidedatafile:
        sidedata_end = self.sidedata_cut_off(rev)
        transaction.add(self._sidedatafile, sidedata_end)

    transaction.add(self._indexfile, end)
    docket = self._docket
    if docket is not None:
        # XXX the docket could be leveraged while stripping, but it was
        # not powerful enough for that when this was written.
        docket.index_end = end
        docket.data_end = data_end
        docket.sidedata_end = sidedata_end
        docket.write(transaction, stripping=True)

    # Step 2: drop the in-memory state that refers to stripped revisions.
    self._chaininfocache = util.lrucachedict(500)
    self._inner.clear_cache()

    del self.index[rev:-1]

3712

3713

def checksize(self):
    """Check size of index and data files

    return a (dd, di) tuple.
    - dd: extra bytes for the "data" file
    - di: extra bytes for the "index" file

    A healthy revlog will return (0, 0).

    A missing data or index file counts as 0 extra bytes for that file.
    """
    # Size the data file should have: the end offset of the last revision.
    expected = 0
    if len(self):
        expected = max(0, self.end(len(self) - 1))

    try:
        with self._datafp() as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        dd = actual - expected
    except FileNotFoundError:
        dd = 0

    try:
        # Use a context manager so the handle is released even if seek()
        # or tell() raises.
        with self.opener(self._indexfile) as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        s = self.index.entry_size
        i = max(0, actual // s)
        # bytes left over after the last whole index entry
        di = actual - (i * s)
        if self._inline:
            # For an inline revlog the index file size is compared against
            # the index entries plus the length of every revision, and no
            # separate data-file excess is reported.
            databytes = 0
            for r in self:
                databytes += max(0, self.length(r))
            dd = 0
            di = actual - len(self) * s - databytes
    except FileNotFoundError:
        di = 0

    return (dd, di)

3752

3753

def files(self):
    """Return the list of files that compose this revlog.

    The index file always comes first. Without a docket file, the data
    file is added unless the revlog is inline. With a docket file, the
    docket itself, the current data/sidedata files (only when the docket
    records a non-zero end for them) and the non-empty old index, data
    and sidedata files reported by the docket are listed.
    """
    paths = [self._indexfile]

    if self._docket_file is None:
        if not self._inline:
            paths.append(self._datafile)
        return paths

    docket = self._docket
    paths.append(self._docket_file)
    paths += docket.old_index_filepaths(include_empty=False)
    if docket.data_end:
        paths.append(self._datafile)
    paths += docket.old_data_filepaths(include_empty=False)
    if docket.sidedata_end:
        paths.append(self._sidedatafile)
    paths += docket.old_sidedata_filepaths(include_empty=False)
    return paths

3769

3770

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
    sidedata_helpers=None,
    debug_info=None,
):
    """Emit revision deltas for ``nodes`` via ``storageutil.emitrevisions``.

    ``nodesorder`` must be ``b'nodes'``, ``b'storage'``, ``b'linear'`` or
    None; anything else raises ``error.ProgrammingError``. A None order
    becomes ``b'storage'`` when general delta is disabled, and the delta
    mode is forced to ``CG_DELTAMODE_FULL`` when this revlog does not
    store delta chains (unless ``CG_DELTAMODE_PREV`` was requested).
    """
    accepted_orders = (b'nodes', b'storage', b'linear', None)
    if nodesorder not in accepted_orders:
        raise error.ProgrammingError(
            b'unhandled value for nodesorder: %s' % nodesorder
        )

    if nodesorder is None:
        if not self.delta_config.general_delta:
            nodesorder = b'storage'

    if not self._storedeltachains:
        if deltamode != repository.CG_DELTAMODE_PREV:
            deltamode = repository.CG_DELTAMODE_FULL

    return storageutil.emitrevisions(
        self,
        nodes,
        nodesorder,
        revlogrevisiondelta,
        deltaparentfn=self.deltaparent,
        candeltafn=self._candelta,
        rawsizefn=self.rawsize,
        revdifffn=self.revdiff,
        flagsfn=self.flags,
        deltamode=deltamode,
        revisiondata=revisiondata,
        assumehaveparentrevisions=assumehaveparentrevisions,
        sidedata_helpers=sidedata_helpers,
        debug_info=debug_info,
    )

3810

3811

# Accepted values for the ``deltareuse`` argument of clone().
DELTAREUSEALWAYS = b'always'
DELTAREUSESAMEREVS = b'samerevs'
DELTAREUSENEVER = b'never'

DELTAREUSEFULLADD = b'fulladd'

# Every known ``deltareuse`` value, gathered in one set.
DELTAREUSEALL = {
    DELTAREUSEALWAYS,
    DELTAREUSESAMEREVS,
    DELTAREUSENEVER,
    DELTAREUSEFULLADD,
}

3818

3819

def clone(
    self,
    tr,
    destrevlog,
    addrevisioncb=None,
    deltareuse=DELTAREUSESAMEREVS,
    forcedeltabothparents=None,
    sidedata_helpers=None,
):
    """Copy every revision of this revlog into ``destrevlog``.

    The destination ends up holding the same revisions and nodes, possibly
    in a different format. It is not guaranteed to be bit-for-bit identical
    to the source, e.g. because the delta encoding may differ.

    ``deltareuse`` selects how deltas stored in this revlog are carried
    over to the destination:

    DELTAREUSEALWAYS
       Reuse existing deltas whenever possible, even if the destination
       revlog would not have selected the same revisions for the delta.
       This is the fastest mode of operation.
    DELTAREUSESAMEREVS
       Reuse an existing delta only if the destination revlog would pick
       the same revisions for the delta. This is the default and strikes
       a balance between speed and optimization: when a better delta base
       is available it is used instead. For instance, when converting a
       non-generaldelta revlog to a generaldelta one, deltas are
       recomputed if the delta's parent is not a parent of the revision.
    DELTAREUSENEVER
       Never reuse deltas. This is the slowest mode of execution; it can
       be used to recompute all deltas (e.g. if the diff/delta algorithm
       changes).
    DELTAREUSEFULLADD
       Re-add each revision as if it were new content. Slower than
       DELTAREUSEALWAYS, but lets more mechanisms kick in (e.g. large
       file detection and handling).

    Delta computation can be slow, so the chosen policy can significantly
    affect run time.

    ``forcedeltabothparents`` controls whether deltas against both parents
    are force-computed for merges. Any false value (including the default
    ``None``) falls back to the destination's current setting.

    ``addrevisioncb``, when set, is forwarded to ``_clone()``, which calls
    it after each revision has been added.

    See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
    `sidedata_helpers`.

    Raises ``ValueError`` if ``deltareuse`` is not a known policy, if the
    destination is not empty, or if either revlog has filtered revisions.
    """
    if deltareuse not in self.DELTAREUSEALL:
        msg = _(b'value for deltareuse invalid: %s') % deltareuse
        raise ValueError(msg)

    if len(destrevlog):
        raise ValueError(_(b'destination revlog is not empty'))

    if getattr(self, 'filteredrevs', None):
        raise ValueError(_(b'source revlog has filtered revisions'))
    if getattr(destrevlog, 'filteredrevs', None):
        raise ValueError(_(b'destination revlog has filtered revisions'))

    # The destination works on a private copy of its delta configuration
    # for the duration of the clone; the original object is put back in
    # the ``finally`` clause whatever happens.
    old_delta_config = destrevlog.delta_config
    destrevlog.delta_config = destrevlog.delta_config.copy()

    try:
        # lazy_delta and lazy_delta_base control whether to reuse a cached
        # delta, if possible. Each entry maps a policy to its
        # (lazy_delta_base, lazy_delta) pair. DELTAREUSEFULLADD is absent
        # on purpose: it leaves both settings untouched.
        lazy_settings = {
            self.DELTAREUSEALWAYS: (True, True),
            self.DELTAREUSESAMEREVS: (False, True),
            self.DELTAREUSENEVER: (False, False),
        }
        chosen = lazy_settings.get(deltareuse)
        if chosen is not None:
            lazy_base, lazy = chosen
            destrevlog.delta_config.lazy_delta_base = lazy_base
            destrevlog.delta_config.lazy_delta = lazy

        destrevlog.delta_config.delta_both_parents = (
            forcedeltabothparents or old_delta_config.delta_both_parents
        )

        with self.reading(), destrevlog._writing(tr):
            self._clone(
                tr,
                destrevlog,
                addrevisioncb,
                deltareuse,
                forcedeltabothparents,
                sidedata_helpers,
            )

    finally:
        destrevlog.delta_config = old_delta_config

3918

3919

def _clone(
    self,
    tr,
    destrevlog,
    addrevisioncb,
    deltareuse,
    forcedeltabothparents,
    sidedata_helpers,
):
    """Do the actual work of `revlog.clone` once arguments are processed.

    Walks every revision of this revlog in order and adds it to
    ``destrevlog``, either through ``addrevision()`` (DELTAREUSEFULLADD)
    or through ``_addrevision()`` with, when allowed, the stored delta
    passed along as ``cachedelta``. ``addrevisioncb(self, rev, node)`` is
    invoked after each revision if it is set.
    """

    def run_helpers(rev, sidedata, flags):
        """Return (sidedata, flags) after the sidedata helpers ran."""
        if sidedata_helpers is None:
            return sidedata, flags
        sidedata, new_flags = sidedatautil.run_sidedata_helpers(
            self, sidedata_helpers, sidedata, rev
        )
        # NOTE(review): ``&`` binds tighter than ``|``, so the "remove"
        # mask (new_flags[1]) only filters new_flags[0] and never clears a
        # bit already present in ``flags`` -- confirm this is intended.
        return sidedata, flags | (new_flags[0] & ~new_flags[1])

    debug_writer = tr._report if self.delta_config.debug_delta else None
    deltacomputer = deltautil.deltacomputer(
        destrevlog,
        write_debug=debug_writer,
    )
    full_readd = deltareuse == self.DELTAREUSEFULLADD
    index = self.index
    for rev in self:
        entry = index[rev]

        # Some classes override linkrev to take filtered revs into
        # account. Use raw entry from index.
        flags = entry[0] & 0xFFFF
        linkrev = entry[4]
        p1 = index[entry[5]][7]
        p2 = index[entry[6]][7]
        node = entry[7]

        if full_readd:
            text = self._revisiondata(rev)
            sidedata = self.sidedata(rev)
            sidedata, flags = run_helpers(rev, sidedata, flags)

            destrevlog.addrevision(
                text,
                tr,
                linkrev,
                p1,
                p2,
                cachedelta=None,
                node=node,
                flags=flags,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )
        else:
            # (Possibly) reuse the delta from the revlog if allowed and
            # the revlog chunk is a delta.
            cachedelta = None
            if destrevlog.delta_config.lazy_delta:
                base = self.deltaparent(rev)
                if base != nullrev:
                    cachedelta = (base, bytes(self._inner._chunk(rev)))

            rawtext = None
            sidedata = None
            if not cachedelta:
                # No reusable delta: hand over the raw text instead.
                try:
                    rawtext = self._revisiondata(rev)
                except error.CensoredNodeError as censored:
                    assert flags & REVIDX_ISCENSORED
                    rawtext = censored.tombstone
                sidedata = self.sidedata(rev)
            if sidedata is None:
                sidedata = self.sidedata(rev)

            sidedata, flags = run_helpers(rev, sidedata, flags)

            destrevlog._addrevision(
                node,
                rawtext,
                tr,
                linkrev,
                p1,
                p2,
                flags,
                cachedelta,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )

        if addrevisioncb:
            addrevisioncb(self, rev, node)

4012

4013

def censorrevision(self, tr, censor_nodes, tombstone=b''):
    """Censor ``censor_nodes`` using the rewriter for this revlog's format.

    Version 0 revlogs cannot be censored and raise ``error.RevlogError``.
    Version 1 revlogs are handled by ``rewrite.v1_censor``; every other
    format version goes through ``rewrite.v2_censor``.
    """
    version = self._format_version
    if version == REVLOGV0:
        raise error.RevlogError(
            _(b'cannot censor with version %d revlogs') % version
        )

    censor = rewrite.v1_censor if version == REVLOGV1 else rewrite.v2_censor
    censor(self, tr, censor_nodes, tombstone)

4023

4024

def verifyintegrity(self, state) -> Iterable[repository.iverifyproblem]:
    """Check this revlog for problems, yielding them as they are found.

    This is a generator of ``revlogproblem`` instances. ``state`` is a
    dict shared with the caller: ``expectedversion``, ``erroroncensored``
    and the optional ``skipflags`` are read from it, while ``skipread``
    and ``safe_renamed`` are reset to empty sets. Nodes whose content
    could not be checked are added to ``skipread``.
    """
    data_excess, index_excess = self.checksize()
    if data_excess:
        yield revlogproblem(
            error=_(b'data length off by %d bytes') % data_excess
        )
    if index_excess:
        yield revlogproblem(
            error=_(b'index contains %d extra bytes') % index_excess
        )

    version = self._format_version

    # The verifier tells us what version revlog we should be.
    expected = state[b'expectedversion']
    if version != expected:
        yield revlogproblem(
            warning=_(b"warning: '%s' uses revlog format %d; expected %d")
            % (self.display_id, version, expected)
        )

    state[b'skipread'] = set()
    state[b'safe_renamed'] = set()

    for rev in self:
        node = self.node(rev)

        # Verify contents. 4 cases to care about:
        #
        #   common: the most common case
        #   rename: with a rename
        #   meta: file content starts with b'\1\n', the metadata
        #         header defined in filelog.py, but without a rename
        #   ext: content stored externally
        #
        # More formally, their differences are shown below:
        #
        #                       | common | rename | meta  | ext
        #  -------------------------------------------------------
        #   flags()             | 0      | 0      | 0     | not 0
        #   renamed()           | False  | True   | False | ?
        #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
        #
        # "rawtext" means the raw text stored in revlog data, which
        # could be retrieved by "rawdata(rev)". "text"
        # mentioned below is "revision(rev)".
        #
        # There are 3 different lengths stored physically:
        #  1. L1: rawsize, stored in revlog index
        #  2. L2: len(rawtext), stored in revlog data
        #  3. L3: len(text), stored in revlog data if flags==0, or
        #     possibly somewhere else if flags!=0
        #
        # L1 should be equal to L2. L3 could be different from them.
        # "text" may or may not affect commit hash depending on flag
        # processors (see flagutil.addflagprocessor).
        #
        #              | common | rename | meta  | ext
        # -------------------------------------------------
        # rawsize()    | L1     | L1     | L1    | L1
        # size()       | L1     | L2-LM  | L1(*) | L1 (?)
        # len(rawtext) | L2     | L2     | L2    | L2
        # len(text)    | L2     | L2     | L2    | L3
        # len(read())  | L2     | L2-LM  | L2-LM | L3 (?)
        #
        # LM:  length of metadata, depending on rawtext
        # (*): not ideal, see comment in filelog.size
        # (?): could be "- len(meta)" if the resolved content has
        #      rename metadata
        #
        # Checks needed to be done:
        #  1. length check: L1 == L2, in all cases.
        #  2. hash check: depending on flag processor, we may need to
        #     use either "text" (external), or "rawtext" (in revlog).

        try:
            # Only the requested flags that this revision carries matter.
            skipflags = state.get(b'skipflags', 0)
            if skipflags:
                skipflags &= self.flags(rev)

            _verify_revision(self, skipflags, state, node)

            indexed_size = self.rawsize(rev)
            actual_size = len(self.rawdata(node))

            if indexed_size != actual_size:
                yield revlogproblem(
                    error=_(b'unpacked size is %d, %d expected')
                    % (actual_size, indexed_size),
                    node=node,
                )

        except error.CensoredNodeError:
            if state[b'erroroncensored']:
                yield revlogproblem(
                    error=_(b'censored file data'), node=node
                )
                state[b'skipread'].add(node)
        except Exception as exc:
            # Any other failure is reported as a problem rather than
            # raised, so the remaining revisions are still checked.
            yield revlogproblem(
                error=_(b'unpacking %s: %s')
                % (short(node), stringutil.forcebytestr(exc)),
                node=node,
            )
            state[b'skipread'].add(node)

4128

4129

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Return a dict of storage details, one key per requested item.

    Each true argument adds the bytes key of the same name:

    ``exclusivefiles``
       list of ``(opener, path)`` pairs: the index file, plus the data
       file unless the revlog is inline
    ``sharedfiles``
       always an empty list
    ``revisionscount``
       ``len(self)``
    ``trackedsize``
       sum of ``rawsize()`` over all revisions
    ``storedsize``
       sum of the ``st_size`` of every path returned by ``files()``
    """
    info = {}

    if exclusivefiles:
        owned = [(self.opener, self._indexfile)]
        if not self._inline:
            owned.append((self.opener, self._datafile))
        info[b'exclusivefiles'] = owned

    if sharedfiles:
        info[b'sharedfiles'] = []

    if revisionscount:
        info[b'revisionscount'] = len(self)

    if trackedsize:
        info[b'trackedsize'] = sum(self.rawsize(rev) for rev in self)

    if storedsize:
        total = 0
        for path in self.files():
            total += self.opener.stat(path).st_size
        info[b'storedsize'] = total

    return info

4159

4160

def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
    """Generate sidedata for revisions ``startrev`` to ``endrev`` inclusive.

    For each revision, the sidedata helpers are run against an empty
    sidedata mapping. The serialized (and possibly compressed) result is
    appended to the sidedata file, then the matching index entries are
    updated in memory and rewritten on disk.

    This is a no-op when the revlog has no sidedata support or when both
    ``helpers[1]`` and ``helpers[2]`` are empty.

    Raises ``error.Abort`` if a revision in the range already has
    sidedata, since rewriting it would leave garbage in the revlog.
    """
    if not self.feature_config.has_side_data:
        return
    # revlog formats with sidedata support do not support inline
    assert not self._inline
    if not helpers[1] and not helpers[2]:
        # Nothing to generate or remove
        return

    new_entries = []
    # append the new sidedata
    with self._writing(transaction):
        ifh, _dfh, sdfh = self._inner._writinghandles
        # All sidedata is written through ``sdfh``, so that is the handle
        # that must be positioned at the current end of the sidedata.
        sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)

        current_offset = sdfh.tell()
        for rev in range(startrev, endrev + 1):
            entry = self.index[rev]
            new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                store=self,
                sidedata_helpers=helpers,
                sidedata={},
                rev=rev,
            )

            serialized_sidedata = sidedatautil.serialize_sidedata(
                new_sidedata
            )

            sidedata_compression_mode = COMP_MODE_INLINE
            if serialized_sidedata and self.feature_config.has_side_data:
                sidedata_compression_mode = COMP_MODE_PLAIN
                h, comp_sidedata = self._inner.compress(serialized_sidedata)
                # Compare one-byte slices: indexing bytes yields an int on
                # Python 3, which never equals a bytes object.
                if (
                    h != b'u'
                    and comp_sidedata[0:1] != b'\0'
                    and len(comp_sidedata) < len(serialized_sidedata)
                ):
                    assert not h
                    if (
                        comp_sidedata[0:1]
                        == self._docket.default_compression_header
                    ):
                        sidedata_compression_mode = COMP_MODE_DEFAULT
                    else:
                        sidedata_compression_mode = COMP_MODE_INLINE
                    serialized_sidedata = comp_sidedata
            if entry[8] != 0 or entry[9] != 0:
                # rewriting entries that already have sidedata is not
                # supported yet, because it introduces garbage data in the
                # revlog.
                msg = b"rewriting existing sidedata is not supported yet"
                raise error.Abort(msg)

            # Apply (potential) flags to add and to remove after running
            # the sidedata helpers
            #
            # NOTE(review): ``&`` binds tighter than ``|``, so the "remove"
            # mask (flags[1]) only filters flags[0] and never clears a bit
            # already set in entry[0] -- confirm this is intended.
            new_offset_flags = entry[0] | (flags[0] & ~flags[1])
            entry_update = (
                current_offset,
                len(serialized_sidedata),
                new_offset_flags,
                sidedata_compression_mode,
            )

            # the sidedata computation might have moved the file cursors
            # around
            sdfh.seek(current_offset, os.SEEK_SET)
            sdfh.write(serialized_sidedata)
            new_entries.append(entry_update)
            current_offset += len(serialized_sidedata)
            self._docket.sidedata_end = sdfh.tell()

        # rewrite the new index entries
        ifh.seek(startrev * self.index.entry_size)
        for i, e in enumerate(new_entries):
            rev = startrev + i
            self.index.replace_sidedata_info(
                rev, *e
            )  # pytype: disable=attribute-error
            packed = self.index.entry_binary(rev)
            if rev == 0 and self._docket is None:
                # Without a docket, the first index entry also carries
                # the revlog header.
                header = self._format_flags | self._format_version
                header = self.index.pack_header(header)
                packed = header + packed
            ifh.write(packed)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # revlog.py - storage back-end for mercurial
             # coding: utf8
             #
             # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Storage back-end for Mercurial.
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches.
             """
             from __future__ import annotations
             import binascii
             import collections
             import contextlib
             import io
             import os
             import struct
             import typing
             import weakref
             import zlib
             from typing import (
                 Iterable,
                 Iterator,
                 Optional,
                 Tuple,
             )
             # import stuff from node for others to import from revlog
             from .node import (
                 bin,
                 hex,
                 nullrev,
                 sha1nodeconstants,
                 short,
                 wdirrev,
             )
             from .i18n import _
             from .revlogutils.constants import (
                 ALL_KINDS,
                 CHANGELOGV2,
                 COMP_MODE_DEFAULT,
                 COMP_MODE_INLINE,
                 COMP_MODE_PLAIN,
                 DELTA_BASE_REUSE_NO,
                 DELTA_BASE_REUSE_TRY,
                 ENTRY_RANK,
                 FEATURES_BY_VERSION,
                 FLAG_GENERALDELTA,
                 FLAG_INLINE_DATA,
                 INDEX_HEADER,
                 KIND_CHANGELOG,
                 KIND_FILELOG,
                 RANK_UNKNOWN,
                 REVLOGV0,
                 REVLOGV1,
                 REVLOGV1_FLAGS,
                 REVLOGV2,
                 REVLOGV2_FLAGS,
                 REVLOG_DEFAULT_FLAGS,
                 REVLOG_DEFAULT_FORMAT,
                 REVLOG_DEFAULT_VERSION,
                 SUPPORTED_FLAGS,
             )
             from .revlogutils.flagutil import (
                 REVIDX_DEFAULT_FLAGS,
                 REVIDX_ELLIPSIS,
                 REVIDX_EXTSTORED,
                 REVIDX_FLAGS_ORDER,
                 REVIDX_HASCOPIESINFO,
                 REVIDX_ISCENSORED,
                 REVIDX_RAWTEXT_CHANGING_FLAGS,
             )
             from .thirdparty import attr
             # Force pytype to use the non-vendored package
             if typing.TYPE_CHECKING:
                 # noinspection PyPackageRequirements
                 import attr
                 from .pure.parsers import BaseIndexObject
             from . import (
                 ancestor,
                 dagop,
                 error,
                 mdiff,
                 policy,
                 pycompat,
                 revlogutils,
                 templatefilters,
                 util,
                 vfs as vfsmod,
             )
             from .interfaces import (
                 repository,
             )
             from .revlogutils import (
                 deltas as deltautil,
                 docket as docketutil,
                 flagutil,
                 nodemap as nodemaputil,
                 randomaccessfile,
                 revlogv0,
                 rewrite,
                 sidedata as sidedatautil,
             )
             from .utils import (
                 storageutil,
                 stringutil,
             )
             # Bare references to all of these names, so that pyflakes does not flag
             # the imports as unused.
             # We need these names available in the module for extensions.
             REVLOGV0
             REVLOGV1
             REVLOGV2
             CHANGELOGV2
             FLAG_INLINE_DATA
             FLAG_GENERALDELTA
             REVLOG_DEFAULT_FLAGS
             REVLOG_DEFAULT_FORMAT
             REVLOG_DEFAULT_VERSION
             REVLOGV1_FLAGS
             REVLOGV2_FLAGS
             REVIDX_ISCENSORED
             REVIDX_ELLIPSIS
             REVIDX_HASCOPIESINFO
             REVIDX_EXTSTORED
             REVIDX_DEFAULT_FLAGS
             REVIDX_FLAGS_ORDER
             REVIDX_RAWTEXT_CHANGING_FLAGS
             parsers = policy.importmod('parsers')
-            rustancestor = policy.importrust('ancestor')
+            rustancestor = policy.importrust('ancestor', pyo3=True)
             rustdagop = policy.importrust('dagop', pyo3=True)
             rustrevlog = policy.importrust('revlog')
             # Aliased for performance: a module-level name spares the attribute lookup
             # on ``zlib`` each time the function is called.
             _zlibdecompress = zlib.decompress
             # max size of inline data embedded into a revlog (131072 = 128 * 1024)
             _maxinline = 131072
             # Flag processors for REVIDX_ELLIPSIS.
             def ellipsisreadprocessor(rl, text):
                 """Read processor: give ``text`` back untouched, paired with False."""
                 result = (text, False)
                 return result


             def ellipsiswriteprocessor(rl, text):
                 """Write processor: give ``text`` back untouched, paired with False."""
                 result = (text, False)
                 return result


             def ellipsisrawprocessor(rl, text):
                 """Raw processor: always answer False, whatever ``text`` is."""
                 return False


             # the three processors above, in (read, write, raw) order
             ellipsisprocessor = (
                 ellipsisreadprocessor,
                 ellipsiswriteprocessor,
                 ellipsisrawprocessor,
             )
             def _verify_revision(rl, skipflags, state, node):
                 """Verify the integrity of the given revlog ``node`` while providing a hook
                 point for extensions to influence the operation."""
                 if skipflags:
                     state[b'skipread'].add(node)
                 else:
                     # Side-effect: read content and verify hash.
                     rl.revision(node)
             # True if a fast implementation for persistent-nodemap is available
             #
             # We also consider that we have a "fast" implementation in "pure" Python,
             # because people using pure don't really have performance considerations
             # (and have a wheelbarrow of other sources of slowness).
             #
             # The flag is set when the Rust revlog module was imported, or when the
             # loaded ``parsers`` module exposes ``BaseIndexObject`` (presumably only
             # the pure Python parsers do -- TODO confirm).
             HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
                 parsers, 'BaseIndexObject'
             )
             @attr.s(slots=True)
             class revlogrevisiondelta(repository.irevisiondelta):
                 """Slotted ``attr`` record describing one revision delta.

                 Subclass of ``repository.irevisiondelta``. Every field is required at
                 construction time except ``linknode``, which defaults to None.
                 """

                 # required node identifiers (bytes)
                 node = attr.ib(type=bytes)
                 p1node = attr.ib(type=bytes)
                 p2node = attr.ib(type=bytes)
                 basenode = attr.ib(type=bytes)
                 flags = attr.ib(type=int)
                 # the following four fields are typed Optional: they may be None
                 baserevisionsize = attr.ib(type=Optional[int])
                 revision = attr.ib(type=Optional[bytes])
                 delta = attr.ib(type=Optional[bytes])
                 sidedata = attr.ib(type=Optional[bytes])
                 protocol_flags = attr.ib(type=int)
                 # the only field with a default value
                 linknode = attr.ib(default=None, type=Optional[bytes])
             @attr.s(frozen=True)
             class revlogproblem(repository.iverifyproblem):
                 """Frozen ``attr`` record describing one verification problem.

                 Subclass of ``repository.iverifyproblem``. All three fields are
                 optional bytes defaulting to None.
                 """

                 warning = attr.ib(default=None, type=Optional[bytes])
                 error = attr.ib(default=None, type=Optional[bytes])
                 node = attr.ib(default=None, type=Optional[bytes])
             def parse_index_v1(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2``.

                 No ``format`` is passed, so the parser's default format applies.
                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # hand the raw index data over to the parsers module
                 parsed = parsers.parse_index2(data, inline)
                 index, cache = parsed
                 return (index, cache)
             def parse_index_v2(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2`` in REVLOGV2 format.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # hand the raw index data over to the parsers module
                 parsed = parsers.parse_index2(data, inline, format=REVLOGV2)
                 index, cache = parsed
                 return (index, cache)
             def parse_index_cl_v2(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2`` in CHANGELOGV2
                 format.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # hand the raw index data over to the parsers module
                 parsed = parsers.parse_index2(data, inline, format=CHANGELOGV2)
                 index, cache = parsed
                 return (index, cache)
             if not hasattr(parsers, 'parse_index_devel_nodemap'):
                 # the loaded parsers module offers no devel nodemap parser
                 parse_index_v1_nodemap = None
             else:

                 def parse_index_v1_nodemap(data, inline):
                     """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``.

                     Returns the ``(index, cache)`` pair produced by the parser.
                     """
                     parsed = parsers.parse_index_devel_nodemap(data, inline)
                     index, cache = parsed
                     return (index, cache)
             def parse_index_v1_rust(data, inline, default_header):
                 """Build a ``rustrevlog.Index`` from ``data`` and ``default_header``.

                 Returns ``(index, cache)`` where ``cache`` is ``(0, data)`` for an
                 inline revlog and None otherwise.
                 """
                 if inline:
                     cache = (0, data)
                 else:
                     cache = None
                 rust_index = rustrevlog.Index(data, default_header)
                 return rust_index, cache
             # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
             # signed integer)
             _maxentrysize = 0x7FFFFFFF
             # Translatable message template. It takes four values: one ``%s`` followed
             # by three ``%d`` (going by the wording: the revlog, the expected byte
             # count, the offset read from and the actual data size).
             FILE_TOO_SHORT_MSG = _(
                 b'cannot read from revlog %s;'
                 b'  expected %d bytes from offset %d, data size is %d'
             )
             # every hexadecimal digit, in both lower and upper case, as bytes
             hexdigits = b'0123456789abcdefABCDEF'
             class _Config:
                 def copy(self):
                     return self.__class__(**self.__dict__)
             @attr.s()
             class FeatureConfig(_Config):
                 """Hold configuration values about the available revlog features"""

                 # the default compression engine
                 compression_engine = attr.ib(default=b'zlib')
                 # compression engines options (a fresh dict per instance)
                 compression_engine_options = attr.ib(default=attr.Factory(dict))
                 # can we use censor on this revlog
                 censorable = attr.ib(default=False)
                 # does this revlog use the "side data" feature
                 has_side_data = attr.ib(default=False)
                 # might remove rank configuration once the computation has no impact
                 compute_rank = attr.ib(default=False)
                 # parent order is supposed to be semantically irrelevant, so we
                 # normally resort parents to ensure that the first parent is non-null,
                 # if there is a non-null parent at all.
                 # filelog abuses the parent order as flag to mark some instances of
                 # meta-encoded files, so allow it to disable this behavior.
                 canonical_parent_order = attr.ib(default=False)
                 # can ellipsis commit be used
                 enable_ellipsis = attr.ib(default=False)

                 def copy(self):
                     """Copy this config, giving the copy its own options dict.

                     The base ``copy`` shares attribute values, so the
                     ``compression_engine_options`` dict is duplicated here to keep
                     the copy independent from the original.
                     """
                     new = super().copy()
                     new.compression_engine_options = self.compression_engine_options.copy()
                     return new
             @attr.s()
             class DataConfig(_Config):
                 """Hold configuration values about how the revlog data are read"""

                 # should we try to open the "pending" version of the revlog
                 try_pending = attr.ib(default=False)
                 # should we try to open the "split" version of the revlog
                 try_split = attr.ib(default=False)
                 #  When True, indexfile should be opened with checkambig=True at writing,
                 #  to avoid file stat ambiguity.
                 check_ambig = attr.ib(default=False)
                 # If true, use mmap instead of reading to deal with large index
                 mmap_large_index = attr.ib(default=False)
                 # how much data is considered large
                 mmap_index_threshold = attr.ib(default=None)
                 # How much data to read and cache into the raw revlog data cache.
                 chunk_cache_size = attr.ib(default=65536)
                 # The size of the uncompressed cache compared to the largest revision seen.
                 uncompressed_cache_factor = attr.ib(default=None)
                 # The number of chunks cached
                 uncompressed_cache_count = attr.ib(default=None)
                 # Allow sparse reading of the revlog data
                 with_sparse_read = attr.ib(default=False)
                 # minimal density of a sparse read chunk
                 sr_density_threshold = attr.ib(default=0.50)
                 # minimal size of data we skip when performing sparse read
                 sr_min_gap_size = attr.ib(default=262144)
                 # are deltas encoded against arbitrary bases.
                 generaldelta = attr.ib(default=False)
             @attr.s()
             class DeltaConfig(_Config):
                 """Hold configuration values about how new deltas are computed

                 Some attributes are duplicated from DataConfig to help having each
                 object self contained.
                 """

                 # can delta be encoded against arbitrary bases.
                 general_delta = attr.ib(default=False)
                 # Allow sparse writing of the revlog data
                 sparse_revlog = attr.ib(default=False)
                 # maximum length of a delta chain
                 max_chain_len = attr.ib(default=None)
                 # Maximum distance between delta chain base start and end
                 max_deltachain_span = attr.ib(default=-1)
                 # If `upper_bound_comp` is not None, this is the expected maximal gain from
                 # compression for the data content.
                 upper_bound_comp = attr.ib(default=None)
                 # Should we try a delta against both parents
                 delta_both_parents = attr.ib(default=True)
                 # Test delta base candidate groups by chunks of this maximal size.
                 candidate_group_chunk_size = attr.ib(default=0)
                 # Should we display debug information about delta computation
                 debug_delta = attr.ib(default=False)
                 # trust incoming delta by default
                 lazy_delta = attr.ib(default=True)
                 # trust the base of incoming delta by default
                 lazy_delta_base = attr.ib(default=False)
             class _InnerRevlog:
                 """An inner layer of the revlog object
                 That layer exists so that some operations can be delegated to Rust; its
                 boundaries are arbitrary and based on what we can delegate to Rust.
                 """
                 opener: vfsmod.vfs
                 def __init__(
                     self,
                     opener: vfsmod.vfs,
                     index,
                     index_file,
                     data_file,
                     sidedata_file,
                     inline,
                     data_config,
                     delta_config,
                     feature_config,
                     chunk_cache,
                     default_compression_header,
                 ):
                     """Store the given collaborators and set up the caches.

                     ``opener`` is used to open ``index_file``, ``data_file`` and
                     ``sidedata_file``. ``inline`` selects which of the index or data
                     file backs the main segment reader. ``chunk_cache`` is passed to
                     that main segment reader only; the sidedata reader gets none.
                     ``default_compression_header`` may be None, in which case no
                     default decompressor is available.
                     """
                     self.opener = opener
                     self.index: BaseIndexObject = index
                     self.index_file = index_file
                     self.data_file = data_file
                     self.sidedata_file = sidedata_file
                     self.inline = inline
                     self.data_config = data_config
                     self.delta_config = delta_config
                     self.feature_config = feature_config
                     # used during diverted write.
                     self._orig_index_file = None
                     self._default_compression_header = default_compression_header
                     # index
                     # 3-tuple of file handles being used for active writing.
                     self._writinghandles = None
                     # An inline revlog keeps its data in the index file, so that is
                     # the file the segment reader works on in that case.
                     self._segmentfile = randomaccessfile.randomaccessfile(
                         self.opener,
                         (self.index_file if self.inline else self.data_file),
                         self.data_config.chunk_cache_size,
                         chunk_cache,
                     )
                     self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
                         self.opener,
                         self.sidedata_file,
                         self.data_config.chunk_cache_size,
                     )
                     # revlog header -> revlog compressor
                     self._decompressors = {}
                     # 3-tuple of (node, rev, text) for a raw revision.
                     self._revisioncache = None
                     # cache some uncompressed chunks
                     # rev → uncompressed_chunk
                     #
                     # the max cost is dynamically updated to be proportional to the
                     # size of revision we actually encounter.
                     #
                     # The cache only exists when `uncompressed_cache_factor` is set;
                     # its capacity comes from `uncompressed_cache_count`.
                     self._uncompressed_chunk_cache = None
                     if self.data_config.uncompressed_cache_factor is not None:
                         self._uncompressed_chunk_cache = util.lrucachedict(
                             self.data_config.uncompressed_cache_count,
                             maxcost=65536,  # some arbitrary initial value
                         )
                     # not None while index writes are being delayed in memory
                     self._delay_buffer = None
                 def __len__(self):
                     return len(self.index)
                 def clear_cache(self):
                     assert not self.is_delaying
                     self._revisioncache = None
                     if self._uncompressed_chunk_cache is not None:
                         self._uncompressed_chunk_cache.clear()
                     self._segmentfile.clear_cache()
                     self._segmentfile_sidedata.clear_cache()
                 @property
                 def canonical_index_file(self):
                     if self._orig_index_file is not None:
                         return self._orig_index_file
                     return self.index_file
                 @property
                 def is_delaying(self):
                     """is the revlog is currently delaying the visibility of written data?
                     The delaying mechanism can be either in-memory or written on disk in a
                     side-file."""
                     return (self._delay_buffer is not None) or (
                         self._orig_index_file is not None
                     )
                 # Derived from index values.
                 def start(self, rev):
                     """the offset of the data chunk for this revision"""
                     return int(self.index[rev][0] >> 16)
                 def length(self, rev):
                     """the length of the data chunk for this revision"""
                     return self.index[rev][1]
                 def end(self, rev):
                     """the end of the data chunk for this revision"""
                     return self.start(rev) + self.length(rev)
                 def deltaparent(self, rev):
                     """return deltaparent of the given revision"""
                     base = self.index[rev][3]
                     if base == rev:
                         return nullrev
                     elif self.delta_config.general_delta:
                         return base
                     else:
                         return rev - 1
                 def issnapshot(self, rev):
                     """tells whether rev is a snapshot

                     Without ``sparse_revlog``, only a revision with no delta parent
                     qualifies. With it, the index's own ``issnapshot`` is used when the
                     index provides one; otherwise the pure Python logic below applies.
                     """
                     if not self.delta_config.sparse_revlog:
                         return self.deltaparent(rev) == nullrev
                     elif hasattr(self.index, 'issnapshot'):
                         # directly assign the method to cache the testing and access
                         # (the instance attribute shadows this method on later calls)
                         self.issnapshot = self.index.issnapshot
                         return self.issnapshot(rev)
                     if rev == nullrev:
                         return True
                     entry = self.index[rev]
                     base = entry[3]
                     if base == rev:
                         return True
                     if base == nullrev:
                         return True
                     # Resolve the first parent: while its stored chunk is empty, follow
                     # its delta parent instead.
                     p1 = entry[5]
                     while self.length(p1) == 0:
                         b = self.deltaparent(p1)
                         if b == p1:
                             break
                         p1 = b
                     # Same resolution for the second parent.
                     p2 = entry[6]
                     while self.length(p2) == 0:
                         b = self.deltaparent(p2)
                         if b == p2:
                             break
                         p2 = b
                     # A delta against one of the resolved parents is not a snapshot.
                     if base == p1 or base == p2:
                         return False
                     # Otherwise the answer is the one for the base (recursive).
                     return self.issnapshot(base)
                 def _deltachain(self, rev, stoprev=None):
                     """Obtain the delta chain for a revision.
                     ``stoprev`` specifies a revision to stop at. If not specified, we
                     stop at the base of the chain.
                     Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
                     revs in ascending order and ``stopped`` is a bool indicating whether
                     ``stoprev`` was hit.
                     """
                     generaldelta = self.delta_config.general_delta
                     # Try C implementation.
                     try:
                         return self.index.deltachain(
                             rev, stoprev, generaldelta
                         )  # pytype: disable=attribute-error
                     except AttributeError:
                         pass
                     chain = []
                     # Alias to prevent attribute lookup in tight loop.
                     index = self.index
                     iterrev = rev
                     e = index[iterrev]
                     while iterrev != e[3] and iterrev != stoprev:
                         chain.append(iterrev)
                         if generaldelta:
                             iterrev = e[3]
                         else:
                             iterrev -= 1
                         e = index[iterrev]
                     if iterrev == stoprev:
                         stopped = True
                     else:
                         chain.append(iterrev)
                         stopped = False
                     chain.reverse()
                     return chain, stopped
                 @util.propertycache
                 def _compressor(self):
                     """Revlog compressor of the configured compression engine, built
                     with the configured engine options."""
                     features = self.feature_config
                     engine = util.compengines[features.compression_engine]
                     options = features.compression_engine_options
                     return engine.revlogcompressor(options)
                 @util.propertycache
                 def _decompressor(self):
                     """the default decompressor

                     None when no default compression header is set; otherwise the
                     ``decompress`` callable of the compressor matching that header.
                     """
                     header = self._default_compression_header
                     if header is None:
                         return None
                     return self._get_decompressor(header).decompress
                 def _get_decompressor(self, t: bytes):
                     """Return the compressor object registered for revlog header ``t``.

                     Compressors are created on first use and memoized in
                     ``self._decompressors``.

                     Raises ``error.RevlogError`` when a ``KeyError`` escapes the engine
                     lookup or the compressor creation for ``t``.
                     """
                     try:
                         compressor = self._decompressors[t]
                     except KeyError:
                         # first time this header is seen: build and remember it
                         try:
                             engine = util.compengines.forrevlogheader(t)
                             compressor = engine.revlogcompressor(
                                 self.feature_config.compression_engine_options
                             )
                             self._decompressors[t] = compressor
                         except KeyError:
                             raise error.RevlogError(
                                 _(b'unknown compression type %s') % binascii.hexlify(t)
                             )
                     return compressor
                 def compress(self, data: bytes) -> Tuple[bytes, bytes]:
                     """Generate a possibly-compressed representation of data."""
                     if not data:
                         return b'', data
                     compressed = self._compressor.compress(data)
                     if compressed:
                         # The revlog compressor added the header in the returned data.
                         return b'', compressed
                     if data[0:1] == b'\0':
                         return b'', data
                     return b'u', data
                 def decompress(self, data: bytes):
                     """Decompress a revlog chunk.

                     The chunk is expected to begin with a header identifying the
                     format type so it can be routed to an appropriate decompressor.

                     Empty data and chunks starting with a NUL byte are returned as is;
                     a ``b'u'`` chunk is returned without its first byte. Raises
                     ``error.RevlogError`` when zlib fails on a ``b'x'`` chunk.
                     """
                     if not data:
                         return data
                     # Revlogs are read much more frequently than they are written and many
                     # chunks only take microseconds to decompress, so performance is
                     # important here.
                     #
                     # We can make a few assumptions about revlogs:
                     #
                     # 1) the majority of chunks will be compressed (as opposed to inline
                     #    raw data).
                     # 2) decompressing *any* data will likely be at least 10x slower than
                     #    returning raw inline data.
                     # 3) we want to prioritize common and officially supported compression
                     #    engines
                     #
                     # It follows that we want to optimize for "decompress compressed data
                     # when encoded with common and officially supported compression engines"
                     # case over "raw data" and "data encoded by less common or non-official
                     # compression engines." That is why we have the inline lookup first
                     # followed by the compengines lookup.
                     #
                     # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
                     # compressed chunks. And this matters for changelog and manifest reads.
                     t = data[0:1]
                     if t == b'x':
                         try:
                             return _zlibdecompress(data)
                         except zlib.error as e:
                             raise error.RevlogError(
                                 _(b'revlog decompress error: %s')
                                 % stringutil.forcebytestr(e)
                             )
                     # '\0' is more common than 'u' so it goes first.
                     elif t == b'\0':
                         return data
                     elif t == b'u':
                         # skip the one-byte marker
                         return util.buffer(data, 1)
                     # any other header: look the matching compressor up
                     compressor = self._get_decompressor(t)
                     return compressor.decompress(data)
                 @contextlib.contextmanager
                 def reading(self):
                     """Context manager that keeps data and sidedata files open for reading"""
                     if len(self.index) == 0:
                         yield  # nothing to be read
                     elif self._delay_buffer is not None and self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)
                     else:
                         with self._segmentfile.reading():
                             with self._segmentfile_sidedata.reading():
                                 yield
                 @property
                 def is_writing(self):
                     """True is a writing context is open"""
                     return self._writinghandles is not None
                 @property
                 def is_open(self):
                     """True if any file handle is being held
                     Used for assert and debug in the python code"""
                     return self._segmentfile.is_open or self._segmentfile_sidedata.is_open
                 @contextlib.contextmanager
                 def writing(self, transaction, data_end=None, sidedata_end=None):
                     """Open the revlog files for writing
                     Add content to a revlog should be done within such context.
                     """
                     if self.is_writing:
                         yield
                     else:
                         ifh = dfh = sdfh = None
                         try:
                             r = len(self.index)
                             # opening the data file.
                             dsize = 0
                             if r:
                                 dsize = self.end(r - 1)
                             dfh = None
                             if not self.inline:
                                 try:
                                     dfh = self.opener(self.data_file, mode=b"r+")
                                     if data_end is None:
                                         dfh.seek(0, os.SEEK_END)
                                     else:
                                         dfh.seek(data_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     dfh = self.opener(self.data_file, mode=b"w+")
                                 transaction.add(self.data_file, dsize)
                             if self.sidedata_file is not None:
                                 assert sidedata_end is not None
                                 # revlog-v2 does not inline, help Pytype
                                 assert dfh is not None
                                 try:
                                     sdfh = self.opener(self.sidedata_file, mode=b"r+")
                                     dfh.seek(sidedata_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     sdfh = self.opener(self.sidedata_file, mode=b"w+")
                                 transaction.add(self.sidedata_file, sidedata_end)
                             # opening the index file.
                             isize = r * self.index.entry_size
                             ifh = self.__index_write_fp()
                             if self.inline:
                                 transaction.add(self.index_file, dsize + isize)
                             else:
                                 transaction.add(self.index_file, isize)
                             # exposing all file handle for writing.
                             self._writinghandles = (ifh, dfh, sdfh)
                             self._segmentfile.writing_handle = ifh if self.inline else dfh
                             self._segmentfile_sidedata.writing_handle = sdfh
                             yield
                         finally:
                             self._writinghandles = None
                             self._segmentfile.writing_handle = None
                             self._segmentfile_sidedata.writing_handle = None
                             if dfh is not None:
                                 dfh.close()
                             if sdfh is not None:
                                 sdfh.close()
                             # closing the index file last to avoid exposing referent to
                             # potential unflushed data content.
                             if ifh is not None:
                                 ifh.close()
                 def __index_write_fp(self, index_end=None):
                     """internal method to open the index file for writing
                     You should not use this directly and use `_writing` instead
                     """
                     try:
                         if self._delay_buffer is None:
                             f = self.opener(
                                 self.index_file,
                                 mode=b"r+",
                                 checkambig=self.data_config.check_ambig,
                             )
                         else:
                             # check_ambig affect we way we open file for writing, however
                             # here, we do not actually open a file for writting as write
                             # will appened to a delay_buffer. So check_ambig is not
                             # meaningful and unneeded here.
                             f = randomaccessfile.appender(
                                 self.opener, self.index_file, b"r+", self._delay_buffer
                             )
                         if index_end is None:
                             f.seek(0, os.SEEK_END)
                         else:
                             f.seek(index_end, os.SEEK_SET)
                         return f
                     except FileNotFoundError:
                         if self._delay_buffer is None:
                             return self.opener(
                                 self.index_file,
                                 mode=b"w+",
                                 checkambig=self.data_config.check_ambig,
                             )
                         else:
                             return randomaccessfile.appender(
                                 self.opener, self.index_file, b"w+", self._delay_buffer
                             )
                 def __index_new_fp(self):
                     """internal method to create a new index file for writing
                     You should not use this unless you are upgrading from inline revlog
                     """
                     return self.opener(
                         self.index_file,
                         mode=b"w",
                         checkambig=self.data_config.check_ambig,
                     )
                 def split_inline(self, tr, header, new_index_file_path=None):
                     """split the data of an inline revlog into an index and a data file

                     ``header`` is packed in front of the first index entry of the new
                     index file. When ``new_index_file_path`` is given, it becomes
                     ``self.index_file`` before the new index is written.

                     Must not be called while writes are delayed in memory. If writing
                     handles were open on entry, new ones (index and data) are opened
                     for the split files before returning.

                     Returns the (possibly updated) ``self.index_file``.
                     """
                     assert self._delay_buffer is None
                     existing_handles = False
                     if self._writinghandles is not None:
                         existing_handles = True
                         fp = self._writinghandles[0]
                         fp.flush()
                         fp.close()
                         # We can't use the cached file handle after close(). So prevent
                         # its usage.
                         self._writinghandles = None
                         self._segmentfile.writing_handle = None
                         # No need to deal with sidedata writing handle as it is only
                         # relevant with revlog-v2 which is never inline, not reaching
                         # this code
                     new_dfh = self.opener(self.data_file, mode=b"w+")
                     new_dfh.truncate(0)  # drop any potentially existing data
                     try:
                         # copy every revision's raw segment into the new data file
                         with self.reading():
                             for r in range(len(self.index)):
                                 new_dfh.write(self.get_segment_for_revs(r, r)[1])
                             new_dfh.flush()
                         if new_index_file_path is not None:
                             self.index_file = new_index_file_path
                         # rewrite the index, now holding index entries only
                         with self.__index_new_fp() as fp:
                             self.inline = False
                             for i in range(len(self.index)):
                                 e = self.index.entry_binary(i)
                                 if i == 0:
                                     packed_header = self.index.pack_header(header)
                                     e = packed_header + e
                                 fp.write(e)
                             # If we don't use side-write, the temp file replaces the
                             # real index when we exit the context manager
                         # from now on, segments are read from the data file
                         self._segmentfile = randomaccessfile.randomaccessfile(
                             self.opener,
                             self.data_file,
                             self.data_config.chunk_cache_size,
                         )
                         if existing_handles:
                             # switched from inline to conventional: reopen the index
                             ifh = self.__index_write_fp()
                             self._writinghandles = (ifh, new_dfh, None)
                             self._segmentfile.writing_handle = new_dfh
                             # the handle is now owned by the writing handles; do not
                             # close it in the `finally` below
                             new_dfh = None
                             # No need to deal with sidedata writing handle as it is only
                             # relevant with revlog-v2 which is never inline, not reaching
                             # this code
                     finally:
                         if new_dfh is not None:
                             new_dfh.close()
                     return self.index_file
                 def get_segment_for_revs(self, startrev, endrev):
                     """Read the raw bytes spanning revisions ``startrev`` to ``endrev``.

                     The span runs from the start of ``startrev``'s data to the end of
                     ``endrev``'s data and is fetched through
                     ``self._segmentfile.read_chunk()``.

                     Returns a 2-tuple ``(offset, data)``: ``offset`` is the integer
                     position of the span and ``data`` is whatever ``read_chunk()``
                     returned for it. Callers will need to call ``self.start(rev)`` and
                     ``self.length(rev)`` to determine where each revision's data begins
                     and ends inside ``data``.

                     API: we should consider making this a private part of the
                     InnerRevlog at some point.
                     """
                     # ``self.start()`` / ``self.end()`` are deliberately inlined here:
                     # this is a hot path and function calls are expensive.
                     idx = self.index
                     first_entry = idx[startrev]
                     # the first index field carries the offset above its low 16 bits
                     begin = int(first_entry[0] >> 16)
                     if startrev != endrev:
                         last_entry = idx[endrev]
                         finish = int(last_entry[0] >> 16) + last_entry[1]
                     else:
                         finish = begin + first_entry[1]
                     if self.inline:
                         # inline revlogs interleave index entries with the data, so
                         # skip the entries written up to (and including) each revision
                         begin += (startrev + 1) * self.index.entry_size
                         finish += (endrev + 1) * self.index.entry_size
                     span = finish - begin
                     return begin, self._segmentfile.read_chunk(begin, span)
                 def _chunk(self, rev):
                     """Return the decompressed chunk stored for a single revision.

                     The uncompressed-chunk cache, when there is one, is consulted first
                     and is fed the result (cost: the chunk length) after a miss.

                     Raises ``error.RevlogError`` when the index records a compression
                     mode that is none of the known ``COMP_MODE_*`` values.
                     """
                     cache = self._uncompressed_chunk_cache
                     if cache is not None:
                         hit = cache.get(rev)
                         if hit is not None:
                             return hit
                     mode = self.index[rev][10]
                     raw = self.get_segment_for_revs(rev, rev)[1]
                     if mode == COMP_MODE_PLAIN:
                         # stored as-is
                         chunk = raw
                     elif mode == COMP_MODE_DEFAULT:
                         chunk = self._decompressor(raw)
                     elif mode == COMP_MODE_INLINE:
                         chunk = self.decompress(raw)
                     else:
                         raise error.RevlogError(b'unknown compression mode %d' % mode)
                     if cache is not None:
                         cache.insert(rev, chunk, cost=len(chunk))
                     return chunk
                 def _chunks(self, revs, targetsize=None):
                     """Obtain decompressed chunks for the specified revisions.

                     Accepts a list of numeric revisions that are assumed to be in
                     ascending order.

                     This function is similar to calling ``self._chunk()`` multiple times,
                     but is faster: the uncompressed-chunk cache (when enabled) is
                     consulted first and the remaining revisions are read from disk in
                     bulk segments.

                     ``targetsize`` is only forwarded to ``deltautil.slicechunk()``, which
                     is used when ``self.data_config.with_sparse_read`` is set.

                     Returns a list with decompressed data for each requested revision,
                     ordered by revision number.

                     Raises ``error.RevlogError`` on an unknown compression mode.
                     """
                     if not revs:
                         return []
                     start = self.start
                     length = self.length
                     inline = self.inline
                     iosize = self.index.entry_size
                     buffer = util.buffer
                     # revisions that still have to be read from disk
                     fetched_revs = []
                     fadd = fetched_revs.append
                     # (rev, chunk) pairs, sorted by rev right before returning
                     chunks = []
                     ladd = chunks.append
                     if self._uncompressed_chunk_cache is None:
                         fetched_revs = revs
                     else:
                         for rev in revs:
                             cached_value = self._uncompressed_chunk_cache.get(rev)
                             if cached_value is None:
                                 fadd(rev)
                             else:
                                 ladd((rev, cached_value))
                     if not fetched_revs:
                         slicedchunks = ()
                     elif not self.data_config.with_sparse_read:
                         slicedchunks = (fetched_revs,)
                     else:
                         slicedchunks = deltautil.slicechunk(
                             self,
                             fetched_revs,
                             targetsize=targetsize,
                         )
                     for revschunk in slicedchunks:
                         firstrev = revschunk[0]
                         # Skip trailing revisions with empty diff
                         for lastrev in revschunk[::-1]:
                             if length(lastrev) != 0:
                                 break
                         try:
                             offset, data = self.get_segment_for_revs(firstrev, lastrev)
                         except OverflowError:
                             # issue4215 - we can't cache a run of chunks greater than
                             # 2G on Windows
                             for rev in revschunk:
                                 ladd((rev, self._chunk(rev)))
                             # Every revision of this slice has been handled one by one
                             # above. Falling through would use an unbound (or stale)
                             # ``data``/``offset`` and add each revision a second time.
                             continue
                         decomp = self.decompress
                         # self._decompressor might be None, but will not be used in that case
                         def_decomp = self._decompressor
                         for rev in revschunk:
                             chunkstart = start(rev)
                             if inline:
                                 # account for the index entries interleaved with the data
                                 chunkstart += (rev + 1) * iosize
                             chunklength = length(rev)
                             comp_mode = self.index[rev][10]
                             # view of this revision's bytes inside the bulk segment
                             c = buffer(data, chunkstart - offset, chunklength)
                             if comp_mode == COMP_MODE_PLAIN:
                                 # stored uncompressed, nothing to do
                                 pass
                             elif comp_mode == COMP_MODE_INLINE:
                                 c = decomp(c)
                             elif comp_mode == COMP_MODE_DEFAULT:
                                 c = def_decomp(c)
                             else:
                                 msg = b'unknown compression mode %d'
                                 msg %= comp_mode
                                 raise error.RevlogError(msg)
                             ladd((rev, c))
                             if self._uncompressed_chunk_cache is not None:
                                 self._uncompressed_chunk_cache.insert(rev, c, len(c))
                     # cached and freshly read entries were appended out of order
                     chunks.sort()
                     return [x[1] for x in chunks]
                 def raw_text(self, node, rev) -> bytes:
                     """Rebuild the rawtext of ``rev`` without validating it.

                     The delta chain of ``rev`` is resolved (stopping early at the
                     revision held in ``self._revisioncache`` when possible), its chunks
                     are fetched through ``self._chunks()`` and applied on top of the base
                     text with ``mdiff.patches()``.

                     ``node`` is not used by this method.

                     Side effects: ``self._revisioncache`` is reset to None, and the
                     ``maxcost`` of the uncompressed-chunk cache may be raised.

                     returns rawtext
                     """
                     # The cache entry looks like (node, rev, rawtext)
                     cache_entry = self._revisioncache
                     stop_at = cache_entry[1] if cache_entry else None
                     chain, stopped = self._deltachain(rev, stoprev=stop_at)
                     # When the chain stopped on the cached revision, its text is the
                     # intermediate text the deltas get applied to.
                     base = cache_entry[2] if stopped else None
                     # drop cache to save memory, the caller is expected to
                     # update self._inner._revisioncache after validating the text
                     del cache_entry
                     self._revisioncache = None
                     rawsize = self.index[rev][2]
                     read_target = 4 * rawsize if rawsize >= 0 else None
                     chunk_cache = self._uncompressed_chunk_cache
                     if chunk_cache is not None:
                         # dynamically update the uncompressed_chunk_cache size to the
                         # largest revision we saw in this revlog.
                         wanted = rawsize * self.data_config.uncompressed_cache_factor
                         if wanted > chunk_cache.maxcost:
                             chunk_cache.maxcost = wanted
                     deltas = self._chunks(chain, targetsize=read_target)
                     if base is None:
                         # no cached text to start from: the first chunk is the base
                         base = bytes(deltas[0])
                         deltas = deltas[1:]
                     patched = mdiff.patches(base, deltas)
                     del base  # let us have a chance to free memory early
                     return patched
                 def sidedata(self, rev, sidedata_end):
                     """Load and deserialize the sidedata attached to revision ``rev``.

                     ``sidedata_end`` is compared against the end of the entry's sidedata
                     span; ``error.RevlogError`` is raised when the span reaches past it.

                     Returns ``{}`` when the index records a sidedata size of 0, otherwise
                     the result of ``sidedatautil.deserialize_sidedata()`` on the
                     (decompressed) segment. An unknown compression mode also raises
                     ``error.RevlogError``.
                     """
                     entry = self.index[rev]
                     offset = entry[8]
                     size = entry[9]
                     if self.inline:
                         offset += self.index.entry_size * (1 + rev)
                     if size == 0:
                         return {}
                     if sidedata_end < offset + size:
                         details = (self.sidedata_file, size, offset, sidedata_end)
                         raise error.RevlogError(FILE_TOO_SHORT_MSG % details)
                     raw = self._segmentfile_sidedata.read_chunk(offset, size)
                     mode = self.index[rev][11]
                     if mode == COMP_MODE_PLAIN:
                         return sidedatautil.deserialize_sidedata(raw)
                     if mode == COMP_MODE_DEFAULT:
                         return sidedatautil.deserialize_sidedata(self._decompressor(raw))
                     if mode == COMP_MODE_INLINE:
                         return sidedatautil.deserialize_sidedata(self.decompress(raw))
                     raise error.RevlogError(b'unknown compression mode %d' % mode)
                 def write_entry(
                     self,
                     transaction,
                     entry,
                     data,
                     link,
                     offset,
                     sidedata,
                     sidedata_offset,
                     index_end,
                     data_end,
                     sidedata_end,
                 ):
                     """Append one revision (index entry, data, sidedata) to the files.

                     The currently open writing handles are positioned first, the
                     pre-write offsets are registered with ``transaction``, then the
                     bytes are written. For an inline revlog everything goes to the index
                     handle; otherwise data, sidedata and index entry go to their own
                     handle (the entry goes to ``self._delay_buffer`` instead when index
                     writes are delayed).

                     ``data`` is indexed as ``data[0]`` then ``data[1]``; both parts are
                     written in that order. ``link`` is not used by this method.

                     Returns a 3-tuple with the position of the index, data and sidedata
                     handles after the write (None for a handle that is not set).

                     Raises ``error.ProgrammingError`` when no writing handles are open,
                     or when a delay buffer is set on an inline revlog.
                     """
                     handles = self._writinghandles
                     if handles is None:
                         raise error.ProgrammingError(
                             b'adding revision outside `revlog._writing` context'
                         )
                     index_fh, data_fh, side_fh = handles
                     # Always seek explicitly before writing. Handles opened in a+ mode
                     # behave inconsistently across platforms: Windows wants a
                     # positioning call whenever a handle switches between reading and
                     # writing (see 3686fa2b8eee and the mixedfilemodewrapper in
                     # windows.py), and some Solaris versions were seen not appending at
                     # the end of the file after a seek before the end (issue4943).
                     #
                     # Note: This is likely not necessary on Python 3. However, because
                     # the file handle is reused for reads and may be seeked there, we
                     # need to be careful before changing this.
                     if index_end is not None:
                         index_fh.seek(index_end, os.SEEK_SET)
                     else:
                         index_fh.seek(0, os.SEEK_END)
                     if data_fh:
                         if data_end is not None:
                             data_fh.seek(data_end, os.SEEK_SET)
                         else:
                             data_fh.seek(0, os.SEEK_END)
                     if side_fh:
                         side_fh.seek(sidedata_end, os.SEEK_SET)
                     last_rev = len(self.index) - 1
                     if self.inline:
                         if self._delay_buffer is not None:
                             raise error.ProgrammingError(
                                 b'invalid delayed write on inline revlog'
                             )
                         # inline: the data offset has to account for the index entries
                         offset += last_rev * self.index.entry_size
                         transaction.add(self.canonical_index_file, offset)
                         assert not sidedata
                         for piece in (entry, data[0], data[1]):
                             index_fh.write(piece)
                     else:
                         transaction.add(self.data_file, offset)
                         if self.sidedata_file:
                             transaction.add(self.sidedata_file, sidedata_offset)
                         transaction.add(
                             self.canonical_index_file, last_rev * len(entry)
                         )
                         if data[0]:
                             data_fh.write(data[0])
                         data_fh.write(data[1])
                         if sidedata:
                             side_fh.write(sidedata)
                         if self._delay_buffer is not None:
                             self._delay_buffer.append(entry)
                         else:
                             index_fh.write(entry)
                     data_pos = data_fh.tell() if data_fh else None
                     side_pos = side_fh.tell() if side_fh else None
                     return (index_fh.tell(), data_pos, side_pos)
                 def _divert_index(self):
                     """Return the name of the pending (``.a``) variant of the index file.

                     A trailing ``.s`` on ``self.index_file`` is dropped before ``.a`` is
                     appended.
                     """
                     pending_base = self.index_file
                     split_suffix = b'.s'
                     # when we encounter a legacy inline-changelog, split it. However it
                     # is important to use the expected filename for pending content
                     # (<radix>.a) otherwise hooks won't be seeing the content of the
                     # pending transaction.
                     if pending_base.endswith(split_suffix):
                         pending_base = pending_base[: -len(split_suffix)]
                     return pending_base + b'.a'
                 def delay(self):
                     """Start delaying (or diverting) index writes.

                     * Nothing happens if a delay buffer or a diverted index is already
                       in place.
                     * With an empty index, the index file is diverted: the current name
                       is kept in ``self._orig_index_file``, ``self.index_file`` is set
                       to the name given by ``self._divert_index()`` and any file already
                       present under that name is removed.
                     * Otherwise an empty ``self._delay_buffer`` is installed.

                     Returns the diverted index file name when diverting, else None.
                     Raises ``error.ProgrammingError`` on an inline revlog.
                     """
                     assert not self.is_open
                     if self.inline:
                         raise error.ProgrammingError(
                             "revlog with delayed write should not be inline"
                         )
                     nothing_in_place = (
                         self._delay_buffer is None and self._orig_index_file is None
                     )
                     if not nothing_in_place:
                         # delay or divert already in place
                         return None
                     if len(self.index) != 0:
                         self._delay_buffer = []
                         return None
                     self._orig_index_file = self.index_file
                     self.index_file = self._divert_index()
                     assert self._orig_index_file is not None
                     assert self.index_file is not None
                     vfs = self.opener
                     if vfs.exists(self.index_file):
                         vfs.unlink(self.index_file)
                     return self.index_file
                 def write_pending(self):
                     """Materialize the pending index file and switch over to it.

                     When the index is already diverted, nothing is written and
                     ``(None, True)`` is returned. Otherwise the current index file is
                     copied to the name given by ``self._divert_index()`` (replacing any
                     file already there), the delayed entries are appended to the copy,
                     the delay buffer is dropped and ``self.index_file`` is pointed at
                     the copy (the previous name goes to ``self._orig_index_file``).

                     Returns ``(index_file, any_pending)`` where ``any_pending`` tells
                     whether delayed entries were written.
                     Raises ``error.ProgrammingError`` on an inline revlog.
                     """
                     assert not self.is_open
                     if self.inline:
                         raise error.ProgrammingError(
                             "revlog with delayed write should not be inline"
                         )
                     if self._orig_index_file is not None:
                         return None, True
                     pending_path = self._divert_index()
                     vfs = self.opener
                     if vfs.exists(pending_path):
                         vfs.unlink(pending_path)
                     copy_from = vfs.join(self.index_file)
                     copy_to = vfs.join(pending_path)
                     util.copyfile(copy_from, copy_to)
                     delayed = self._delay_buffer
                     wrote_delayed = bool(delayed)
                     if wrote_delayed:
                         with vfs(pending_path, b'r+') as pending_fh:
                             pending_fh.seek(0, os.SEEK_END)
                             pending_fh.write(b"".join(delayed))
                     self._delay_buffer = None
                     self._orig_index_file = self.index_file
                     self.index_file = pending_path
                     return self.index_file, wrote_delayed
                 def finalize_pending(self):
                     """Make delayed or diverted index content final.

                     * Delay mode: the buffered entries (if any) are appended to
                       ``self.index_file`` and the buffer is dropped.
                     * Divert mode: the diverted file, if it exists, is renamed over the
                       original name and ``self.index_file`` is restored.

                     Returns ``self.canonical_index_file``.
                     Raises ``error.ProgrammingError`` on an inline revlog, or when
                     neither a delay nor a divert is in place.
                     """
                     assert not self.is_open
                     if self.inline:
                         raise error.ProgrammingError(
                             "revlog with delayed write should not be inline"
                         )
                     buffered = self._delay_buffer
                     original_path = self._orig_index_file
                     delaying = buffered is not None
                     diverting = original_path is not None
                     if not (delaying or diverting):
                         raise error.ProgrammingError(
                             b"not delay or divert found on this revlog"
                         )
                     if delaying and diverting:
                         assert False, "unreachable"
                     elif delaying:
                         if buffered:
                             with self.opener(self.index_file, b'r+') as index_fh:
                                 index_fh.seek(0, os.SEEK_END)
                                 index_fh.write(b"".join(buffered))
                         self._delay_buffer = None
                     else:
                         diverted_path = self.index_file
                         if self.opener.exists(diverted_path):
                             self.opener.rename(
                                 diverted_path,
                                 original_path,
                                 checkambig=True,
                             )
                         self.index_file = original_path
                         self._orig_index_file = None
                     return self.canonical_index_file
             # ``ProxyBase`` is the base class used by ``RustIndexProxy`` below. It is
             # ``BaseIndexObject`` for static analysis and plain ``object`` at runtime.
             if typing.TYPE_CHECKING:
                 # Tell Pytype what kind of object we expect
                 ProxyBase = BaseIndexObject
             else:
                 ProxyBase = object
             class RustIndexProxy(ProxyBase):
                 """Wrapper around the Rust index to fake having direct access to the index.

                 Rust enforces xor mutability (one mutable reference XOR 1..n non-mutable),
                 so we can't expose the index from Rust directly, since the `InnerRevlog`
                 already has ownership of the index. This object redirects all calls to the
                 index through the Rust-backed `InnerRevlog` glue which defines all
                 necessary forwarding methods.

                 Attribute ``name`` on the proxy is looked up as ``_index_<name>`` on
                 ``inner``.
                 """

                 def __init__(self, inner):
                     # Do not rename as it's being used to access the index from Rust
                     self.inner = inner

                 # TODO possibly write all index methods manually to save on overhead?
                 def __getattr__(self, name):
                     """Forward unknown attribute ``name`` to ``inner._index_<name>``.

                     Raises ``AttributeError`` when ``inner`` itself is missing.
                     """
                     # ``__getattr__`` only runs when normal lookup failed. If that
                     # happens for ``inner`` (instance not initialised yet, e.g. while
                     # being copied or unpickled), reading ``self.inner`` below would
                     # re-enter this method forever.
                     if name == "inner":
                         raise AttributeError(name)
                     return getattr(self.inner, f"_index_{name}")

                 # Magic methods need to be defined explicitly: they are looked up on
                 # the type, so ``__getattr__`` is never consulted for them.
                 def __len__(self):
                     return self.inner._index___len__()

                 def __getitem__(self, key):
                     return self.inner._index___getitem__(key)

                 def __contains__(self, key):
                     return self.inner._index___contains__(key)

                 def __delitem__(self, key):
                     return self.inner._index___delitem__(key)
             class RustVFSWrapper:
                 """Used to wrap a Python VFS to pass it to Rust to lower the overhead of
                 calling back multiple times into Python.

                 Calling the wrapper opens the file through the wrapped VFS; every other
                 attribute is forwarded to the wrapped VFS unchanged.
                 """

                 def __init__(self, inner):
                     self.inner = inner

                 def __call__(
                     self,
                     path: bytes,
                     mode: bytes = b"rb",
                     atomictemp=False,
                     checkambig=False,
                 ):
                     """Open ``path`` through the wrapped VFS.

                     Returns a 2-tuple: a duplicate (``os.dup``) of the opened file's
                     descriptor, and the file's ``_tempname`` when ``atomictemp`` is set
                     (None otherwise).
                     """
                     fd = self.inner.__call__(
                         path=path, mode=mode, atomictemp=atomictemp, checkambig=checkambig
                     )
                     # Information that Rust needs to get ownership of the file that's
                     # being opened.
                     return (os.dup(fd.fileno()), fd._tempname if atomictemp else None)

                 def __getattr__(self, name):
                     """Forward unknown attribute ``name`` to the wrapped VFS.

                     Raises ``AttributeError`` when ``inner`` itself is missing.
                     """
                     # ``__getattr__`` only runs when normal lookup failed. If that
                     # happens for ``inner`` (instance not initialised yet, e.g. while
                     # being copied or unpickled), reading ``self.inner`` below would
                     # re-enter this method forever.
                     if name == "inner":
                         raise AttributeError(name)
                     return getattr(self.inner, name)
             class revlog:
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, including its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 If checkambig, indexfile is opened with checkambig=True at
                 writing, to avoid file stat ambiguity.
                 If mmaplargeindex is True, and an mmapindexthreshold is set, the
                 index will be mmapped rather than read if it is larger than the
                 configured threshold.
                 If censorable is True, the revlog can have censored revisions.
                 If `upperboundcomp` is not None, this is the expected maximal gain from
                 compression for the data content.
                 `concurrencychecker` is an optional function that receives 3 arguments: a
                 file handle, a filename, and an expected position. It should check whether
                 the current position in the file handle is valid, and log/warn/fail (by
                 raising).
                 See mercurial/revlogutils/constants.py for details about the content of an
                 index entry.
                 """
                 _flagserrorclass = error.RevlogError
                 _inner: "_InnerRevlog"
                 opener: vfsmod.vfs
                 @staticmethod
                 def is_inline_index(header_bytes):
                     """Tell from the first bytes of an index whether the revlog is inline.

                     An empty ``header_bytes`` is reported as inline. Otherwise the header
                     is unpacked with ``INDEX_HEADER``: its low 16 bits select the format
                     version and the remaining bits are the format flags, which are passed
                     to the ``b'inline'`` feature check of that version.
                     """
                     if not len(header_bytes):
                         return True
                     raw_header = INDEX_HEADER.unpack(header_bytes)[0]
                     version = raw_header & 0xFFFF
                     flags = raw_header & ~0xFFFF
                     inline_check = FEATURES_BY_VERSION[version][b'inline']
                     return inline_check(flags)
                 _docket_file: Optional[bytes]
                 def __init__(
                     self,
                     opener: vfsmod.vfs,
                     target,
                     radix,
                     postfix=None,  # only exists for `tmpcensored` now
                     checkambig=False,
                     mmaplargeindex=False,
                     censorable=False,
                     upperboundcomp=None,
                     persistentnodemap=False,
                     concurrencychecker=None,
                     trypending=False,
                     try_split=False,
                     canonical_parent_order=True,
                     data_config=None,
                     delta_config=None,
                     feature_config=None,
                     may_inline=True,  # may inline new revlog
                 ):
                     """
                     create a revlog object

                     opener is a function that abstracts the file opening operation
                     and can be used to implement COW semantics or the like.

                     `target`: a (KIND, ID) tuple that identifies the content stored in
                     this revlog. It helps the rest of the code understand what the revlog
                     is about without having to resort to heuristics and index filename
                     analysis. Note that this must reliably be set by normal code, but
                     that test, debug, or performance measurement code might not set this
                     to an accurate value.

                     `feature_config`, `data_config` and `delta_config`: when given, a copy
                     is used; otherwise a copy of the matching entry of `opener.options`
                     (`b'feature-config'`, `b'data-config'`, `b'delta-config'`) is used if
                     present, and a default-constructed config object as a last resort.

                     Some keyword arguments are then written onto those configs:
                     `censorable` and `canonical_parent_order` onto the feature config,
                     `checkambig` and `mmaplargeindex` onto the data config, and
                     `upperboundcomp` onto the delta config.

                     `persistentnodemap`: when true, the nodemap file name is computed
                     through `nodemaputil.get_nodemap_file()`.

                     The remaining arguments are stored on the instance as-is. The
                     index is loaded (`_loadindex()`) and the inner revlog object is set
                     up (`_load_inner()`) before returning.
                     """
                     self.radix = radix
                     # File names; all None at this point.
                     self._docket_file = None
                     self._indexfile = None
                     self._datafile = None
                     self._sidedatafile = None
                     self._nodemap_file = None
                     self.postfix = postfix
                     self._trypending = trypending
                     self._try_split = try_split
                     self._may_inline = may_inline
                     self.uses_rust = False
                     self.opener = opener
                     if persistentnodemap:
                         self._nodemap_file = nodemaputil.get_nodemap_file(self)
                     assert target[0] in ALL_KINDS
                     assert len(target) == 2
                     self.target = target
                     # Feature config: explicit argument > opener option > default.
                     if feature_config is not None:
                         self.feature_config = feature_config.copy()
                     elif b'feature-config' in self.opener.options:
                         self.feature_config = self.opener.options[b'feature-config'].copy()
                     else:
                         self.feature_config = FeatureConfig()
                     self.feature_config.censorable = censorable
                     self.feature_config.canonical_parent_order = canonical_parent_order
                     # Data config: explicit argument > opener option > default.
                     if data_config is not None:
                         self.data_config = data_config.copy()
                     elif b'data-config' in self.opener.options:
                         self.data_config = self.opener.options[b'data-config'].copy()
                     else:
                         self.data_config = DataConfig()
                     self.data_config.check_ambig = checkambig
                     self.data_config.mmap_large_index = mmaplargeindex
                     # Delta config: explicit argument > opener option > default.
                     if delta_config is not None:
                         self.delta_config = delta_config.copy()
                     elif b'delta-config' in self.opener.options:
                         self.delta_config = self.opener.options[b'delta-config'].copy()
                     else:
                         self.delta_config = DeltaConfig()
                     self.delta_config.upper_bound_comp = upperboundcomp
                     # Maps rev to chain base rev.
                     self._chainbasecache = util.lrucachedict(100)
                     self.index: Optional[BaseIndexObject] = None
                     self._docket = None
                     self._nodemap_docket = None
                     # Mapping of partial identifiers to full nodes.
                     self._pcache = {}
                     # other optional features
                     # Make copy of flag processors so each revlog instance can support
                     # custom flags.
                     self._flagprocessors = dict(flagutil.flagprocessors)
                     # prevent nesting of addgroup
                     self._adding_group = None
                     # Load the index, then hand it (and the chunk cache that came with
                     # it) to the inner revlog setup.
                     index, chunk_cache = self._loadindex()
                     self._load_inner(index, chunk_cache)
                     self._concurrencychecker = concurrencychecker
                 def _init_opts(self):
                     """Derive the default revlog settings from the opener options.

                     The values computed here are only defaults: they might be affected
                     when the on-disk information is actually read. The relevant values
                     are returned, in this order, for use in _loadindex():

                     * new header:
                         version header to use if we need to create a new revlog
                     * mmap index threshold:
                         minimal index size before mmap is used, or None when the
                         data configuration does not ask for mmap
                     * force_nodemap:
                         force the usage of a "development" version of the nodemap code

                     Raises error.RevlogError when the configured chunk cache size is
                     not a strictly positive power of two.
                     """
                     options = self.opener.options
                     wants_changelog_v2 = (
                         b'changelogv2' in options
                         and self.revlog_kind == KIND_CHANGELOG
                     )
                     if wants_changelog_v2:
                         header = CHANGELOGV2
                         self.feature_config.compute_rank = options.get(
                             b'changelogv2.compute-rank', True
                         )
                     elif b'revlogv2' in options:
                         header = REVLOGV2
                     elif b'revlogv1' in options:
                         header = REVLOGV1
                         if self._may_inline:
                             header |= FLAG_INLINE_DATA
                         if b'generaldelta' in options:
                             header |= FLAG_GENERALDELTA
                     elif b'revlogv0' in options:
                         header = REVLOGV0
                     else:
                         header = REVLOG_DEFAULT_VERSION

                     data_config = self.data_config
                     if data_config.mmap_large_index:
                         mmap_threshold = data_config.mmap_index_threshold
                     else:
                         mmap_threshold = None

                     if self.feature_config.enable_ellipsis:
                         self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

                     # revlog v0 doesn't have flag processors
                     extra_processors = options.get(b'flagprocessors', {})
                     for flag, processor in extra_processors.items():
                         flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

                     cache_size = data_config.chunk_cache_size
                     if cache_size <= 0:
                         raise error.RevlogError(
                             _(b'revlog chunk cache size %r is not greater than 0')
                             % cache_size
                         )
                     # a power of two has a single bit set, so `x & (x - 1)` is zero
                     if cache_size & (cache_size - 1):
                         raise error.RevlogError(
                             _(b'revlog chunk cache size %r is not a power of 2')
                             % cache_size
                         )

                     return header, mmap_threshold, options.get(b'devel-force-nodemap', False)
                 def _get_data(self, filepath, mmap_threshold, size=None):
                     """return a file content with or without mmap
                     If the file is missing return the empty string"""
                     try:
                         with self.opener(filepath) as fp:
                             if mmap_threshold is not None:
                                 file_size = self.opener.fstat(fp).st_size
                                 if (
                                     file_size >= mmap_threshold
                                     and self.opener.is_mmap_safe(filepath)
                                 ):
                                     if size is not None:
                                         # avoid potentiel mmap crash
                                         size = min(file_size, size)
                                     # TODO: should .close() to release resources without
                                     # relying on Python GC
                                     if size is None:
                                         return util.buffer(util.mmapread(fp))
                                     else:
                                         return util.buffer(util.mmapread(fp, size))
                             if size is None:
                                 return fp.read()
                             else:
                                 return fp.read(size)
                     except FileNotFoundError:
                         return b''
                 def get_streams(self, max_linkrev, force_inline=False):
                     """Return a list of streams that represent this revlog.

                     This is used by stream-clone to do bytes to bytes copies of a repository.

                     This streams data for all revisions that refer to a changelog revision up
                     to `max_linkrev`.

                     If `force_inline` is set, it enforces that the stream will represent an
                     inline revlog.

                     It returns a list of three-tuples:

                         [
                             (filename, bytes_stream, stream_size),
                             ...
                         ]

                     An empty list is returned when there is no revision to send. Every
                     returned stream is a generator that has already been advanced once,
                     so the `with` block it wraps has been entered before this method
                     returns.
                     """
                     n = len(self)
                     index = self.index
                     # Walk back from the tip and drop the trailing revisions whose
                     # linkrev is not below `max_linkrev`.
                     while n > 0:
                         linkrev = index[n - 1][4]
                         if linkrev < max_linkrev:
                             break
                         # note: this loop will rarely go through multiple iterations, since
                         # it only traverses commits created during the current streaming
                         # pull operation.
                         #
                         # If this become a problem, using a binary search should cap the
                         # runtime of this.
                         n = n - 1
                     if n == 0:
                         # no data to send
                         return []
                     # Sizes of the index and data parts covering the first `n` revisions.
                     index_size = n * index.entry_size
                     data_size = self.end(n - 1)
                     # XXX we might have been split (or stripped) since the object
                     # initialization, We need to close this race too, but having a way to
                     # pre-open the file we feed to the revlog and never closing them before
                     # we are done streaming.
                     if self._inline:
                         # Already inline: a single stream read from the index file, of
                         # index_size + data_size bytes.
                         def get_stream():
                             with self.opener(self._indexfile, mode=b"r") as fp:
                                 # first yield only signals that the file is open
                                 yield None
                                 size = index_size + data_size
                                 # small content is read in one call, larger content is
                                 # iterated in chunks
                                 if size <= 65536:
                                     yield fp.read(size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=size)
                         inline_stream = get_stream()
                         # consume the initial `None` so the file is opened right away
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     elif force_inline:
                         # Not inline on disk, but an inline stream was requested: emit
                         # each index entry followed by the data segment of that revision.
                         def get_stream():
                             with self.reading():
                                 # first yield only signals that reading() was entered
                                 yield None
                                 for rev in range(n):
                                     idx = self.index.entry_binary(rev)
                                     if rev == 0 and self._docket is None:
                                         # re-inject the inline flag
                                         header = self._format_flags
                                         header |= self._format_version
                                         header |= FLAG_INLINE_DATA
                                         header = self.index.pack_header(header)
                                         idx = header + idx
                                     yield idx
                                     yield self._inner.get_segment_for_revs(rev, rev)[1]
                         inline_stream = get_stream()
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     else:
                         # Separate index and data files: one stream for each of them.
                         def get_index_stream():
                             with self.opener(self._indexfile, mode=b"r") as fp:
                                 yield None
                                 if index_size <= 65536:
                                     yield fp.read(index_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=index_size)
                         def get_data_stream():
                             with self._datafp() as fp:
                                 yield None
                                 if data_size <= 65536:
                                     yield fp.read(data_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=data_size)
                         # The index stream is primed (file opened) before the data one.
                         index_stream = get_index_stream()
                         next(index_stream)
                         data_stream = get_data_stream()
                         next(data_stream)
                         # The data stream is listed before the index stream.
                         return [
                             (self._datafile, data_stream, data_size),
                             (self._indexfile, index_stream, index_size),
                         ]
                 def _loadindex(self, docket=None):
                     """Read the revlog entry point and prepare the index for this revlog.

                     The entry point file name is derived from `radix`, `postfix` and the
                     pending/split settings. Unless a `docket` is passed in, the header
                     is read from that file (or taken from _init_opts() when the file is
                     empty or missing) and used to set the format version, format flags
                     and the feature-dependent configuration. The method also records
                     the index/data file names and selects the index parsing function.

                     Returns an ``(index, chunkcache)`` pair. When the Rust index is
                     selected, `index` is the raw index data and `chunkcache` is None.

                     Raises error.RevlogError for an unknown version, unknown flags, an
                     index shorter than the docket announces, or an index that fails to
                     parse.
                     """
                     new_header, mmapindexthreshold, force_nodemap = self._init_opts()
                     # Pick the file acting as entry point for this revlog.
                     if self.postfix is not None:
                         entry_point = b'%s.i.%s' % (self.radix, self.postfix)
                     elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
                         entry_point = b'%s.i.a' % self.radix
                     elif self._try_split and self.opener.exists(self._split_index_file):
                         entry_point = self._split_index_file
                     else:
                         entry_point = b'%s.i' % self.radix
                     if docket is not None:
                         # A docket was provided by the caller: no header is read here.
                         self._docket = docket
                         self._docket_file = entry_point
                     else:
                         self._initempty = True
                         entry_data = self._get_data(entry_point, mmapindexthreshold)
                         if len(entry_data) > 0:
                             # the header is unpacked from the first 4 bytes
                             header = INDEX_HEADER.unpack(entry_data[:4])[0]
                             self._initempty = False
                         else:
                             header = new_header
                         # the low 16 bits hold the version, the remaining bits the flags
                         self._format_flags = header & ~0xFFFF
                         self._format_version = header & 0xFFFF
                         supported_flags = SUPPORTED_FLAGS.get(self._format_version)
                         if supported_flags is None:
                             msg = _(b'unknown version (%d) in revlog %s')
                             msg %= (self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         elif self._format_flags & ~supported_flags:
                             msg = _(b'unknown flags (%#04x) in version %d revlog %s')
                             display_flag = self._format_flags >> 16
                             msg %= (display_flag, self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         features = FEATURES_BY_VERSION[self._format_version]
                         self._inline = features[b'inline'](self._format_flags)
                         self.delta_config.general_delta = features[b'generaldelta'](
                             self._format_flags
                         )
                         self.data_config.generaldelta = self.delta_config.general_delta
                         self.feature_config.has_side_data = features[b'sidedata']
                         if not features[b'docket']:
                             # no docket: the entry point is the index itself
                             self._indexfile = entry_point
                             index_data = entry_data
                         else:
                             # docket-based format: the entry point is the docket file
                             self._docket_file = entry_point
                             if self._initempty:
                                 self._docket = docketutil.default_docket(self, header)
                             else:
                                 self._docket = docketutil.parse_docket(
                                     self, entry_data, use_pending=self._trypending
                                 )
                     if self._docket is not None:
                         # With a docket, the index lives in the file the docket names
                         # and only `index_end` bytes of it are read.
                         self._indexfile = self._docket.index_filepath()
                         index_data = b''
                         index_size = self._docket.index_end
                         if index_size > 0:
                             index_data = self._get_data(
                                 self._indexfile, mmapindexthreshold, size=index_size
                             )
                             if len(index_data) < index_size:
                                 msg = _(b'too few index data for %s: got %d, expected %d')
                                 msg %= (self.display_id, len(index_data), index_size)
                                 raise error.RevlogError(msg)
                         self._inline = False
                         # generaldelta implied by version 2 revlogs.
                         self.delta_config.general_delta = True
                         self.data_config.generaldelta = True
                         # the logic for persistent nodemap will be dealt with within the
                         # main docket, so disable it for now.
                         self._nodemap_file = None
                     # Work out the data (and sidedata) file names.
                     if self._docket is not None:
                         self._datafile = self._docket.data_filepath()
                         self._sidedatafile = self._docket.sidedata_filepath()
                     elif self.postfix is None:
                         self._datafile = b'%s.d' % self.radix
                     else:
                         self._datafile = b'%s.d.%s' % (self.radix, self.postfix)
                     self.nodeconstants = sha1nodeconstants
                     self.nullid = self.nodeconstants.nullid
                     # sparse-revlog can't be on without general-delta (issue6056)
                     if not self.delta_config.general_delta:
                         self.delta_config.sparse_revlog = False
                     self._storedeltachains = True
                     devel_nodemap = (
                         self._nodemap_file
                         and force_nodemap
                         and parse_index_v1_nodemap is not None
                     )
                     use_rust_index = False
                     # The Rust index is considered when a nodemap file is configured
                     # or the revlog is a filelog, unless the opener opts out through
                     # its `rust_compatible` attribute.
                     rust_applicable = self._nodemap_file is not None
                     rust_applicable = rust_applicable or self.target[0] == KIND_FILELOG
                     rust_applicable = rust_applicable and getattr(
                         self.opener, "rust_compatible", True
                     )
                     if rustrevlog is not None and rust_applicable:
                         # we would like to use the rust_index in all case, especially
                         # because it is necessary for AncestorsIterator and LazyAncestors
                         # since the 6.7 cycle.
                         #
                         # However, the performance impact of unconditionally building the
                         # nodemap is currently a problem for non-persistent nodemap
                         # repository.
                         use_rust_index = True
                         if self._format_version != REVLOGV1:
                             use_rust_index = False
                     if hasattr(self.opener, "fncache"):
                         vfs = self.opener.vfs
                         if not self.opener.uses_dotencode:
                             use_rust_index = False
                         if not isinstance(vfs, vfsmod.vfs):
                             # Be cautious since we don't support other vfs
                             use_rust_index = False
                     else:
                         # Rust only supports repos with fncache
                         use_rust_index = False
                     # Select the parser matching the format version; the v1 parser is
                     # the default and the "development" nodemap variant replaces it
                     # only for formats not matched by the version checks below.
                     self._parse_index = parse_index_v1
                     if self._format_version == REVLOGV0:
                         self._parse_index = revlogv0.parse_index_v0
                     elif self._format_version == REVLOGV2:
                         self._parse_index = parse_index_v2
                     elif self._format_version == CHANGELOGV2:
                         self._parse_index = parse_index_cl_v2
                     elif devel_nodemap:
                         self._parse_index = parse_index_v1_nodemap
                     if use_rust_index:
                         # Let the Rust code parse its own index
                         index, chunkcache = (index_data, None)
                         self.uses_rust = True
                     else:
                         try:
                             d = self._parse_index(index_data, self._inline)
                             index, chunkcache = d
                             self._register_nodemap_info(index)
                         except (ValueError, IndexError):
                             raise error.RevlogError(
                                 _(b"index %s is corrupted") % self.display_id
                             )
                     # revnum -> (chain-length, sum-delta-length)
                     self._chaininfocache = util.lrucachedict(500)
                     return index, chunkcache
                 def _load_inner(self, index, chunk_cache):
                     """Create `self._inner` and set `self.index` from a loaded index.

                     `index` and `chunk_cache` are the pair returned by _loadindex().
                     When `self.uses_rust` is true, a `rustrevlog.InnerRevlog` is built
                     from the raw index data and `self.index` becomes a proxy over it;
                     otherwise a Python `_InnerRevlog` is built around the parsed index.
                     """
                     # The default compression header only exists with a docket.
                     if self._docket is None:
                         default_compression_header = None
                     else:
                         default_compression_header = self._docket.default_compression_header
                     if self.uses_rust:
                         vfs_is_readonly = False
                         fncache = None
                         # Unwrap the opener layers: an optional read-only wrapper, then
                         # the object carrying the fncache, down to the vfs whose `base`
                         # is handed to the Rust code.
                         if hasattr(self.opener, "vfs"):
                             vfs = self.opener
                             if isinstance(vfs, vfsmod.readonlyvfs):
                                 vfs_is_readonly = True
                                 vfs = vfs.vfs
                             fncache = vfs.fncache
                             vfs = vfs.vfs
                         else:
                             vfs = self.opener
                         vfs_base = vfs.base
                         assert fncache is not None, "Rust only supports repos with fncache"
                         self._inner = rustrevlog.InnerRevlog(
                             vfs_base=vfs_base,
                             fncache=fncache,
                             vfs_is_readonly=vfs_is_readonly,
                             index_data=index,
                             index_file=self._indexfile,
                             data_file=self._datafile,
                             sidedata_file=self._sidedatafile,
                             inline=self._inline,
                             data_config=self.data_config,
                             delta_config=self.delta_config,
                             feature_config=self.feature_config,
                             chunk_cache=chunk_cache,
                             default_compression_header=default_compression_header,
                             revlog_type=self.target[0],
                             use_persistent_nodemap=self._nodemap_file is not None,
                         )
                         self.index = RustIndexProxy(self._inner)
                         # On this path _loadindex() did not register the nodemap, so
                         # it is done here against the proxy.
                         self._register_nodemap_info(self.index)
                         self.uses_rust = True
                     else:
                         self._inner = _InnerRevlog(
                             opener=self.opener,
                             index=index,
                             index_file=self._indexfile,
                             data_file=self._datafile,
                             sidedata_file=self._sidedatafile,
                             inline=self._inline,
                             data_config=self.data_config,
                             delta_config=self.delta_config,
                             feature_config=self.feature_config,
                             chunk_cache=chunk_cache,
                             default_compression_header=default_compression_header,
                         )
                         self.index = self._inner.index
                 def _register_nodemap_info(self, index):
                     use_nodemap = (
                         not self._inline
                         and self._nodemap_file is not None
                         and hasattr(index, 'update_nodemap_data')
                     )
                     if use_nodemap:
                         nodemap_data = nodemaputil.persisted_data(self)
                         if nodemap_data is not None:
                             docket = nodemap_data[0]
                             if (
                                 len(index) > docket.tip_rev
                                 and index[docket.tip_rev][7] == docket.tip_node
                             ):
                                 # no changelog tampering
                                 self._nodemap_docket = docket
                                 index.update_nodemap_data(
                                     *nodemap_data
                                 )  # pytype: disable=attribute-error
                 def get_revlog(self):
                     """Return this object itself.

                     Simple function mirroring the API of other not-really-revlog
                     objects.
                     """
                     return self
                 @util.propertycache
                 def revlog_kind(self):
                     """The kind of this revlog: the first item of `self.target`."""
                     kind = self.target[0]
                     return kind
                 @util.propertycache
                 def display_id(self):
                     """The public facing "ID" of the revlog that we use in messages."""
                     if self.revlog_kind != KIND_FILELOG:
                         return self.radix
                     # Reference the file without the "data/" prefix, so it is familiar
                     # to the user.
                     return self.target[1]
                 def _datafp(self, mode=b'r'):
                     """file object for the revlog's data file"""
                     return self.opener(self._datafile, mode=mode)
                 def tiprev(self):
                     """Return the last revision number: the index length minus one."""
                     entry_count = len(self.index)
                     return entry_count - 1
                 def tip(self):
                     """Return the node of the tip revision (see tiprev())."""
                     last_rev = self.tiprev()
                     return self.node(last_rev)
                 def __contains__(self, rev):
                     return 0 <= rev < len(self)
                 def __len__(self):
                     return len(self.index)
                 def __iter__(self) -> Iterator[int]:
                     return iter(range(len(self)))
                 def revs(self, start=0, stop=None):
                     """Iterate over the revisions of this revlog, from `start` to `stop`.

                     The iteration itself is delegated to storageutil.iterrevs().
                     """
                     total = len(self)
                     return storageutil.iterrevs(total, start=start, stop=stop)
                 def hasnode(self, node):
                     """Return True if rev() resolves `node`, False if it raises KeyError."""
                     try:
                         self.rev(node)
                     except KeyError:
                         return False
                     return True
                 def _candelta(self, baserev, rev):
                     """whether two revisions (baserev, rev) can be delta-ed or not"""
                     # Disable delta if either rev requires a content-changing flag
                     # processor (ex. LFS). This is because such flag processor can alter
                     # the rawtext content that the delta will be based on, and two clients
                     # could have a same revlog node with different flags (i.e. different
                     # rawtext contents) and the delta could be incompatible.
                     if self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
                         return False
                     if self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS:
                         return False
                     return True
                 def update_caches(self, transaction):
                     """Update the on-disk caches.

                     Only the persistent nodemap is handled, and only when a nodemap
                     file is configured. If a transaction is passed, the update may be
                     delayed to transaction commit.
                     """
                     if self._nodemap_file is None:
                         return
                     if transaction is None:
                         nodemaputil.update_persistent_nodemap(self)
                         return
                     nodemaputil.setup_persistent_nodemap(transaction, self)
                 def clearcaches(self, clear_persisted_data: bool = False) -> None:
                     """Clear in-memory caches.

                     The chain-base cache, the inner revlog cache, the partial-node
                     cache and the index caches are reset. The persisted nodemap data
                     is then reloaded when applicable. `clear_persisted_data` is not
                     used by this implementation.
                     """
                     self._chainbasecache.clear()
                     self._inner.clear_cache()
                     self._pcache = {}
                     self._nodemap_docket = None
                     self.index.clearcaches()
                     # The python code is the one responsible for validating the docket, we
                     # end up having to refresh it here.
                     if self._inline or self._nodemap_file is None:
                         return
                     if not hasattr(self.index, 'update_nodemap_data'):
                         return
                     persisted = nodemaputil.persisted_data(self)
                     if persisted is None:
                         return
                     self._nodemap_docket = persisted[0]
                     self.index.update_nodemap_data(
                         *persisted
                     )  # pytype: disable=attribute-error
                 def rev(self, node):
                     """return the revision number associated with a <nodeid>

                     A TypeError from the index lookup is propagated unchanged. When the
                     lookup fails with error.RevlogError, error.WdirUnsupported is raised
                     for working-directory identifiers and error.LookupError otherwise.
                     """
                     try:
                         return self.index.rev(node)
                     except TypeError:
                         raise
                     except error.RevlogError:
                         # parsers.c radix tree lookup failed
                         constants = self.nodeconstants
                         is_wdir = (
                             node == constants.wdirid
                             or node in constants.wdirfilenodeids
                         )
                         if is_wdir:
                             raise error.WdirUnsupported
                         raise error.LookupError(node, self.display_id, _(b'no node'))
                 # Accessors for index entries.
                 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
                 # are flags.
                 def start(self, rev):
                     """Return the offset of `rev`: the first index field shifted right by 16 bits."""
                     offset_and_flags = self.index[rev][0]
                     return int(offset_and_flags >> 16)
                 def sidedata_cut_off(self, rev):
                     """Return the sidedata cut-off for `rev`.

                     This is the sidedata offset stored for `rev` when it is non-zero.
                     Otherwise it is the end (offset + length) of the closest revision
                     at or before `rev` that has sidedata, or 0 when there is none.
                     """
                     stored_offset = self.index[rev][8]
                     if stored_offset != 0:
                         return stored_offset
                     # This is some annoying dance, because entries without sidedata
                     # currently use 0 as their offset. (instead of previous-offset +
                     # previous-size)
                     #
                     # We should reconsider this sidedata → 0 sidedata_offset policy.
                     # In the meantime, we need this.
                     for candidate in range(rev, -1, -1):
                         entry = self.index[candidate]
                         if entry[9] != 0:
                             return entry[8] + entry[9]
                     return 0
                 def flags(self, rev):
                     """Return the flags of `rev`: the low 16 bits of the first index field."""
                     offset_and_flags = self.index[rev][0]
                     return offset_and_flags & 0xFFFF
                 def length(self, rev):
                     """Return the second field of the index entry of `rev`."""
                     entry = self.index[rev]
                     return entry[1]
                 def sidedata_length(self, rev):
                     """Return the sidedata length of `rev`, or 0 without sidedata support."""
                     if self.feature_config.has_side_data:
                         return self.index[rev][9]
                     return 0
                 def rawsize(self, rev):
                     """return the length of the uncompressed text for a given revision

                     The size stored in the index is used when it is not negative;
                     otherwise the raw data is fetched and measured.
                     """
                     stored_size = self.index[rev][2]
                     if stored_size < 0:
                         return len(self.rawdata(rev))
                     return stored_size
                 def size(self, rev):
                     """length of non-raw text (processed by a "read" flag processor)"""
                     rev_flags = self.flags(rev)
                     # ELLIPSIS is known to not change the content, so it is left out
                     # of the set of flags that force the slow path.
                     content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
                     if rev_flags & content_changing != 0:
                         return len(self.revision(rev))
                     # fast path: no "read" flag processor could change the content,
                     # size is rawsize.
                     return self.rawsize(rev)
                 def fast_rank(self, rev):
                     """Return the rank of a revision if already known, or None otherwise.

                     The rank of a revision is the size of the sub-graph it defines as a
                     head. Equivalently, the rank of a revision `r` is the size of the set
                     `ancestors(r)`, `r` included.

                     This method returns the rank retrieved from the revlog in constant
                     time. It makes no attempt at computing unknown values for versions of
                     the revlog which do not persist the rank.
                     """
                     stored_rank = self.index[rev][ENTRY_RANK]
                     rank_is_known = (
                         self._format_version == CHANGELOGV2
                         and stored_rank != RANK_UNKNOWN
                     )
                     if not rank_is_known:
                         return None
                     # by convention the null revision has rank 0
                     return 0 if rev == nullrev else stored_rank
                 def chainbase(self, rev):
                     """Return the base revision of the delta chain `rev` belongs to.

                     The base field of the index entries is followed until an entry
                     that is its own base is reached. Results are cached per revision.
                     """
                     cache = self._chainbasecache
                     cached = cache.get(rev)
                     if cached is not None:
                         return cached
                     index = self.index
                     current = rev
                     while True:
                         base = index[current][3]
                         if base == current:
                             break
                         current = base
                     cache[rev] = base
                     return base
                 def linkrev(self, rev):
                     """Return the fifth field (linkrev) of the index entry of `rev`."""
                     entry = self.index[rev]
                     return entry[4]
                 def parentrevs(self, rev):
                     """Return the two parent revisions of `rev` as a pair.

                     With canonical parent order enabled, the parents are swapped when
                     the first stored parent is the null revision. An IndexError from
                     the index lookup becomes error.WdirUnsupported when `rev` is the
                     working directory revision and is re-raised otherwise.
                     """
                     try:
                         entry = self.index[rev]
                     except IndexError:
                         if rev == wdirrev:
                             raise error.WdirUnsupported
                         raise
                     first, second = entry[5], entry[6]
                     if self.feature_config.canonical_parent_order and first == nullrev:
                         return second, first
                     return first, second
                 # fast parentrevs(rev) where rev isn't filtered: this alias keeps
                 # pointing at the parentrevs() implementation defined just above.
                 _uncheckedparentrevs = parentrevs
                 def node(self, rev):
                     """Return the node stored in the index entry of `rev`.

                     An IndexError becomes error.WdirUnsupported when `rev` is the
                     working directory revision and is re-raised otherwise.
                     """
                     try:
                         node_id = self.index[rev][7]
                     except IndexError:
                         if rev == wdirrev:
                             raise error.WdirUnsupported
                         raise
                     return node_id
                 # Derived from index values.
                 def end(self, rev):
                     """Return where `rev` ends: its start() plus its length()."""
                     begin = self.start(rev)
                     return begin + self.length(rev)
                 def parents(self, node):
                     """Return the pair of parent nodes of `node`.

                     With canonical parent order enabled, the parents are swapped when
                     the first stored parent is the null node, which mirrors what
                     parentrevs() does with revision numbers.

                     Whatever self.rev() raises for an unknown `node` is propagated.
                     """
                     index = self.index
                     entry = index[self.rev(node)]
                     # inline node() to avoid function call overhead
                     p1_node = index[entry[5]][7]
                     p2_node = index[entry[6]][7]
                     # entry[5] is a revision number, so it can never be equal to the
                     # `nullid` node: compare the parent's node instead.
                     if (
                         self.feature_config.canonical_parent_order
                         and p1_node == self.nullid
                     ):
                         return p2_node, p1_node
                     return p1_node, p2_node
                 def chainlen(self, rev):
                     """Return the delta chain length of `rev` (first item of _chaininfo())."""
                     chain_length = self._chaininfo(rev)[0]
                     return chain_length
                 def _chaininfo(self, rev):
                     chaininfocache = self._chaininfocache
                     if rev in chaininfocache:
                         return chaininfocache[rev]
                     index = self.index
                     generaldelta = self.delta_config.general_delta
                     iterrev = rev
                     e = index[iterrev]
                     clen = 0
                     compresseddeltalen = 0
                     while iterrev != e[3]:
                         clen += 1
                         compresseddeltalen += e[1]
                         if generaldelta:
                             iterrev = e[3]
                         else:
                             iterrev -= 1
                         if iterrev in chaininfocache:
                             t = chaininfocache[iterrev]
                             clen += t[0]
                             compresseddeltalen += t[1]
                             break
                         e = index[iterrev]
                     else:
                         # Add text length of base since decompressing that also takes
                         # work. For cache hits the length is already included.
                         compresseddeltalen += e[1]
                     r = (clen, compresseddeltalen)
                     chaininfocache[rev] = r
                     return r
                 def _deltachain(self, rev, stoprev=None):
                     return self._inner._deltachain(rev, stoprev=stoprev)
                 def ancestors(self, revs, stoprev=0, inclusive=False):
                     """Generate the ancestors of 'revs' in reverse revision order.

                     Does not generate revs lower than stoprev.

                     See the documentation for ancestor.lazyancestors for more details.
                     """
                     revs = list(revs)
                     # First make sure the start revisions aren't filtered: self.node
                     # is called on each of them purely for its checking side effect.
                     check = self.node
                     for startrev in revs:
                         check(startrev)
                     # From here on we're sure the ancestors aren't filtered either,
                     # so the unchecked parent accessor (or the raw index) is enough.
                     use_rust = rustancestor is not None and self.index.rust_ext_compat
                     if use_rust:
                         factory, source = rustancestor.LazyAncestors, self.index
                     else:
                         factory, source = (
                             ancestor.lazyancestors,
                             self._uncheckedparentrevs,
                         )
                     return factory(source, revs, stoprev=stoprev, inclusive=inclusive)
                 def descendants(self, revs):
                     """Return ``dagop.descendantrevs`` for ``revs`` over this revlog.

                     ``self.revs`` and ``self.parentrevs`` are handed over as the
                     revision iterator and the parent accessor.
                     """
                     revsfn = self.revs
                     parentsfn = self.parentrevs
                     return dagop.descendantrevs(revs, revsfn, parentsfn)
                 def findcommonmissing(self, common=None, heads=None):
                     """Return the ancestors of common and what heads add on top of them.

                     The result is a tuple, in revset terminology:

                       ::common, (::heads) - (::common)

                     The first element is a lazy set-like object of revision numbers
                     (it also contains nullrev).  The second is a list of nodes sorted
                     by revision number, meaning it is topologically sorted.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid.
                     """
                     commonnodes = [self.nullid] if common is None else common
                     headnodes = self.heads() if heads is None else heads
                     commonrevs = [self.rev(n) for n in commonnodes]
                     headrevs = [self.rev(n) for n in headnodes]

                     # we want the ancestors, but inclusive
                     class lazyset:
                         """Union of an eagerly filled set and a lazy collection."""

                         def __init__(self, lazyvalues):
                             self.addedvalues = set()
                             self.lazyvalues = lazyvalues

                         def __contains__(self, value):
                             if value in self.addedvalues:
                                 return True
                             return value in self.lazyvalues

                         def __iter__(self):
                             eager = self.addedvalues
                             yield from eager
                             for value in self.lazyvalues:
                                 if value not in eager:
                                     yield value

                         def add(self, value):
                             self.addedvalues.add(value)

                         def update(self, values):
                             self.addedvalues.update(values)

                     has = lazyset(self.ancestors(commonrevs))
                     has.add(nullrev)
                     has.update(commonrevs)

                     # breadth-first walk from the heads, stopping at anything in has
                     missing = set()
                     pending = collections.deque(r for r in headrevs if r not in has)
                     while pending:
                         rev = pending.popleft()
                         if rev in missing:
                             continue
                         missing.add(rev)
                         pending.extend(p for p in self.parentrevs(rev) if p not in has)
                     return has, [self.node(rev) for rev in sorted(missing)]
                 def incrementalmissingrevs(self, common=None):
                     """Return an object that incrementally computes missing ancestors.

                     The object computes the revision numbers of the ancestors of
                     arbitrary sets that are not ancestors of common.  It is either a
                     rustancestor.MissingAncestors (when the Rust extension is present
                     and the index reports ``rust_ext_compat``) or an
                     ancestor.incrementalmissingancestors object.

                     'common' is a list of revision numbers. If common is not supplied,
                     uses nullrev.
                     """
                     bases = [nullrev] if common is None else common
                     if rustancestor is None or not self.index.rust_ext_compat:
                         return ancestor.incrementalmissingancestors(
                             self.parentrevs, bases
                         )
                     return rustancestor.MissingAncestors(self.index, bases)
                 def findmissingrevs(self, common=None, heads=None):
                     """Return the revision numbers of the ancestors of heads that
                     are not ancestors of common.

                     More specifically, return a list of revision numbers corresponding
                     to nodes N such that every N satisfies the following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of revision numbers.  If heads
                     is not supplied, uses all of the revlog's head revisions.  If
                     common is not supplied, uses nullrev.
                     """
                     bases = [nullrev] if common is None else common
                     tips = self.headrevs() if heads is None else heads
                     tracker = self.incrementalmissingrevs(common=bases)
                     return tracker.missingancestors(tips)
                 def findmissing(self, common=None, heads=None):
                     """Return the ancestors of heads that are not ancestors of common.

                     More specifically, return a list of nodes N such that every N
                     satisfies the following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid.
                     """
                     commonnodes = [self.nullid] if common is None else common
                     headnodes = self.heads() if heads is None else heads
                     # translate to revision numbers, compute, translate back
                     commonrevs = [self.rev(n) for n in commonnodes]
                     headrevs = [self.rev(n) for n in headnodes]
                     tracker = self.incrementalmissingrevs(common=commonrevs)
                     missingrevs = tracker.missingancestors(headrevs)
                     return [self.node(r) for r in missingrevs]
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a topological path from 'roots' to 'heads'.

                     Return a tuple (nodes, outroots, outheads) where 'nodes' is a
                     topologically sorted list of all nodes N that satisfy both of
                     these constraints:

                       1. N is a descendant of some node in 'roots'
                       2. N is an ancestor of some node in 'heads'

                     Every node is considered to be both a descendant and an ancestor
                     of itself, so every reachable node in 'roots' and 'heads' will be
                     included in 'nodes'.

                     'outroots' is the list of reachable nodes in 'roots', i.e., the
                     subset of 'roots' that is returned in 'nodes'.  Likewise,
                     'outheads' is the subset of 'heads' that is also in 'nodes'.

                     'roots' and 'heads' are both lists of node IDs.  If 'roots' is
                     unspecified, uses nullid as the only root.  If 'heads' is
                     unspecified, uses list of all of the revlog's heads.

                     An explicitly empty 'roots' or 'heads', or inputs with no
                     connecting path, yield three empty lists."""
                     # Shared "nothing found" result.
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [self.nullid]  # Everybody's a descendant of nullid
                         lowestrev = nullrev
                     if (lowestrev == nullrev) and (heads is None):
                         # We want _all_ the nodes!
                         return (
                             [self.node(r) for r in self],
                             [self.nullid],
                             list(self.heads()),
                         )
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = len(self) - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = set()
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, False)
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = set(heads)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == self.nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendant of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors.add(n)  # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.update(
                                         [p for p in self.parents(n) if p != self.nullid]
                                     )
                                 elif n in heads:  # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > nullrev:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [root for root in roots if root in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(root) for root in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = nullrev
                             roots = [self.nullid]
                     # Transform our roots list into a set.
                     descendants = set(roots)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendants.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descendants, empty parents will look like
                     # they're descendants.
                     for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
                         n = self.node(r)
                         isdescendant = False
                         if lowestrev == nullrev:  # Everybody is a descendant of nullid
                             isdescendant = True
                         elif n in descendants:
                             # n is already a descendant
                             isdescendant = True
                             # This check only needs to be done here because all the roots
                             # were already marked as descendants before the loop.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendants, it's not a root.
                                 if (p[0] in descendants) or (p[1] in descendants):
                                     roots.remove(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendant if either of its parents are
                             # descendants.  (We seeded the descendants set with the
                             # roots up there, remember?)
                             if (p[0] in descendants) or (p[1] in descendants):
                                 descendants.add(n)
                                 isdescendant = True
                         if isdescendant and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendants and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = True
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = True
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     # Keep only the heads that were actually reached (flag is True).
                     heads = [head for head, flag in heads.items() if flag]
                     roots = list(roots)
                     # Sanity checks: at this point all three results are expected to be
                     # non-empty (note that asserts are skipped when Python runs with -O).
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def headrevs(self, revs=None, stop_rev=None):
                     """Return the head revisions, optionally restricted to ``revs``.

                     Without ``revs`` the index computes the heads itself and
                     ``stop_rev`` is forwarded to it.  With ``revs`` the computation is
                     delegated to the Rust dagop module when it is available and the
                     index reports ``rust_ext_compat``, and to ``dagop.headrevs``
                     otherwise; ``stop_rev`` is not used on that path.
                     """
                     if revs is None:
                         return self.index.headrevs(None, stop_rev)
                     if rustdagop is None or not self.index.rust_ext_compat:
                         return dagop.headrevs(revs, self._uncheckedparentrevs)
                     return rustdagop.headrevs(self.index, revs)
                 def headrevsdiff(self, start, stop):
                     """Return the head-revision difference between ``start`` and ``stop``.

                     The index implementation is tried first; if that raises
                     ``AttributeError`` the computation falls back to
                     ``dagop.headrevsdiff`` using the unchecked parent accessor.
                     """
                     try:
                         native = self.index.headrevsdiff  # pytype: disable=attribute-error
                         return native(start, stop)
                     except AttributeError:
                         parentsfn = self._uncheckedparentrevs
                         return dagop.headrevsdiff(parentsfn, start, stop)
                 def computephases(self, roots):
                     """Return ``self.index.computephasesmapsets(roots)``."""
                     index = self.index
                     return index.computephasesmapsets(roots)  # pytype: disable=attribute-error
                 def _head_node_ids(self):
                     try:
                         return self.index.head_node_ids()  # pytype: disable=attribute-error
                     except AttributeError:
                         return [self.node(r) for r in self.headrevs()]
                 def heads(self, start=None, stop=None):
                     """return the list of all nodes that have no children

                     if start is specified, only heads that are descendants of
                     start will be returned
                     if stop is specified, it will consider all the revs from stop
                     as if they had no children

                     With neither argument, an empty revlog yields ``[nullid]``.
                     """
                     if start is None and stop is None:
                         if len(self):
                             return self._head_node_ids()
                         return [self.nullid]

                     startrev = nullrev if start is None else self.rev(start)
                     stoprevs = {self.rev(n) for n in stop or []}
                     headrevs = dagop.headrevssubset(
                         self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
                     )
                     return [self.node(rev) for rev in headrevs]
                 def diffheads(self, start, stop):
                     """return the nodes that make up the difference between
                     heads of revs before `start` and heads of revs before `stop`

                     The result is a ``(removed, added)`` pair of node lists, obtained
                     by mapping ``self.node`` over the result of ``headrevsdiff``.
                     """
                     removedrevs, addedrevs = self.headrevsdiff(start, stop)
                     removednodes = [self.node(rev) for rev in removedrevs]
                     addednodes = [self.node(rev) for rev in addedrevs]
                     return removednodes, addednodes
                 def children(self, node):
                     """find the children of a given node

                     Every revision after ``node`` is scanned.  A revision whose
                     parents are all null counts as a child only when ``node`` itself
                     resolves to nullrev.
                     """
                     found = []
                     target = self.rev(node)
                     for rev in self.revs(start=target + 1):
                         realparents = [
                             pr for pr in self.parentrevs(rev) if pr != nullrev
                         ]
                         if not realparents:
                             if target == nullrev:
                                 found.append(self.node(rev))
                             continue
                         # one entry per parent slot that points at the target
                         found.extend(
                             self.node(rev) for pr in realparents if pr == target
                         )
                     return found
                 def commonancestorsheads(self, a, b):
                     """calculate all the heads of the common ancestors of nodes a and b"""
                     reva = self.rev(a)
                     revb = self.rev(b)
                     headrevs = self._commonancestorsheads(reva, revb)
                     return pycompat.maplist(self.node, headrevs)
                 def _commonancestorsheads(self, *revs):
                     """calculate all the heads of the common ancestors of revs"""
                     try:
                         ancs = self.index.commonancestorsheads(
                             *revs
                         )  # pytype: disable=attribute-error
                     except (AttributeError, OverflowError):  # C implementation failed
                         ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
                     return ancs
                 def isancestor(self, a, b):
                     """return True if node a is an ancestor of node b

                     A revision is considered an ancestor of itself.
                     """
                     reva = self.rev(a)
                     revb = self.rev(b)
                     return self.isancestorrev(reva, revb)
                 def isancestorrev(self, a, b):
                     """return True if revision a is an ancestor of revision b

                     A revision is considered an ancestor of itself.

                     The implementation of this is trivial but the use of
                     reachableroots is not.
                     """
                     # nullrev is an ancestor of everything; so is a revision of itself
                     if a == nullrev or a == b:
                         return True
                     # an ancestor never has a higher revision number
                     if a > b:
                         return False
                     reached = self.reachableroots(a, [b], [a], includepath=False)
                     return bool(reached)
                 def reachableroots(self, minroot, heads, roots, includepath=False):
                     """return (heads(::(<roots> and <roots>::<heads>)))

                     If includepath is True, return (<roots>::<heads>).

                     ``self.index.reachableroots2`` is used when available; on
                     ``AttributeError`` the pure ``dagop._reachablerootspure`` is used.
                     """
                     try:
                         native = self.index.reachableroots2  # pytype: disable=attribute-error
                         return native(minroot, heads, roots, includepath)
                     except AttributeError:
                         parentsfn = self.parentrevs
                         return dagop._reachablerootspure(
                             parentsfn, minroot, roots, heads, includepath
                         )
                 def ancestor(self, a, b):
                     """calculate the "best" common ancestor of nodes a and b

                     Returns nullid when there is no common ancestor.
                     """
                     reva, revb = self.rev(a), self.rev(b)
                     try:
                         candidates = self.index.ancestors(reva, revb)  # pytype: disable=attribute-error
                     except (AttributeError, OverflowError):
                         candidates = ancestor.ancestors(self.parentrevs, reva, revb)
                     if not candidates:
                         return self.nullid
                     # choose a consistent winner when there's a tie
                     return min(self.node(rev) for rev in candidates)
                 def _match(self, id):
                     if isinstance(id, int):
                         # rev
                         return self.node(id)
                     if len(id) == self.nodeconstants.nodelen:
                         # possibly a binary node
                         # odds of a binary node being all hex in ASCII are 1 in 10**25
                         try:
                             node = id
                             self.rev(node)  # quick search the index
                             return node
                         except error.LookupError:
                             pass  # may be partial hex id
                     try:
                         # str(rev)
                         rev = int(id)
                         if b"%d" % rev != id:
                             raise ValueError
                         if rev < 0:
                             rev = len(self) + rev
                         if rev < 0 or rev >= len(self):
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         pass
                     if len(id) == 2 * self.nodeconstants.nodelen:
                         try:
                             # a full hex nodeid?
                             node = bin(id)
                             self.rev(node)
                             return node
                         except (binascii.Error, error.LookupError):
                             pass
                 def _partialmatch(self, id):
                     """Resolve the hex prefix ``id`` to a single node.

                     Returns the matching node, or None when nothing matches.  Raises
                     ``error.AmbiguousPrefixLookupError`` when the prefix is ambiguous
                     and ``error.WdirUnsupported`` when the prefix matches no stored
                     node but is a prefix of ``nodeconstants.wdirhex``.

                     The index's ``partialmatch`` is tried first; the slow path scans
                     every index entry and caches unique results in ``self._pcache``.
                     The slow path only handles prefixes of at most 40 characters;
                     longer ones fall off the end and return None implicitly.
                     """
                     # we don't care wdirfilenodeids as they should be always full hash
                     maybewdir = self.nodeconstants.wdirhex.startswith(id)
                     ambiguous = False
                     try:
                         partial = self.index.partialmatch(
                             id
                         )  # pytype: disable=attribute-error
                         if partial and self.hasnode(partial):
                             if maybewdir:
                                 # single 'ff...' match in radix tree, ambiguous with wdir
                                 ambiguous = True
                             else:
                                 return partial
                         elif maybewdir:
                             # no 'ff...' match in radix tree, wdir identified
                             raise error.WdirUnsupported
                         else:
                             return None
                     except error.RevlogError:
                         # parsers.c radix tree lookup gave multiple matches
                         # fast path: for unfiltered changelog, radix tree is accurate
                         if not getattr(self, 'filteredrevs', None):
                             ambiguous = True
                         # fall through to slow path that filters hidden revisions
                     except (AttributeError, ValueError):
                         # we are pure python, or key is not hex
                         pass
                     if ambiguous:
                         raise error.AmbiguousPrefixLookupError(
                             id, self.display_id, _(b'ambiguous identifier')
                         )
                     # Slow path: first consult the prefix cache filled below.
                     if id in self._pcache:
                         return self._pcache[id]
                     if len(id) <= 40:
                         # hex(node)[:...]
                         l = len(id) // 2 * 2  # grab an even number of digits
                         try:
                             # we're dropping the last digit, so let's check that it's hex,
                             # to avoid the expensive computation below if it's not
                             if len(id) % 2 > 0:
                                 if not (id[-1] in hexdigits):
                                     return None
                             prefix = bin(id[:l])
                         except binascii.Error:
                             # not valid hex: nothing can match, fall off the end
                             pass
                         else:
                             # Coarse filter on the binary prefix (even number of hex
                             # digits), then exact filter on the full hex prefix,
                             # keeping only nodes that hasnode() accepts.
                             nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                             nl = [
                                 n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                             ]
                             if self.nodeconstants.nullhex.startswith(id):
                                 nl.append(self.nullid)
                             if len(nl) > 0:
                                 # Only a unique match that cannot also be wdir is
                                 # cached and returned; anything else is ambiguous.
                                 if len(nl) == 1 and not maybewdir:
                                     self._pcache[id] = nl[0]
                                     return nl[0]
                                 raise error.AmbiguousPrefixLookupError(
                                     id, self.display_id, _(b'ambiguous identifier')
                                 )
                             if maybewdir:
                                 raise error.WdirUnsupported
                             return None
                 def lookup(self, id):
                     """locate a node based on:
                     - revision number or str(revision number)
                     - nodeid or subset of hex nodeid

                     Raises ``error.LookupError`` when nothing matches.
                     """
                     node = self._match(id)
                     if node is None:
                         # no exact match, try the identifier as a prefix
                         node = self._partialmatch(id)
                         if not node:
                             raise error.LookupError(
                                 id, self.display_id, _(b'no match found')
                             )
                     return node
                 def shortest(self, node, minlength=1):
                     """Find the shortest unambiguous prefix that matches node.

                     The returned prefix of ``hex(node)`` is at least ``minlength``
                     characters long.  Raises ``error.LookupError`` when the node is
                     not found.
                     """

                     def isvalid(prefix):
                         # True when prefix resolves unambiguously (or only to wdir),
                         # False when it is ambiguous; raises when nothing matches.
                         try:
                             matchednode = self._partialmatch(prefix)
                         except error.AmbiguousPrefixLookupError:
                             return False
                         except error.WdirUnsupported:
                             # single 'ff...' match
                             return True
                         if matchednode is None:
                             raise error.LookupError(node, self.display_id, _(b'no node'))
                         return True

                     def maybewdir(prefix):
                         # A prefix made only of 'f' could also designate wdir.
                         return all(c == b'f' for c in pycompat.iterbytestr(prefix))

                     hexnode = hex(node)

                     def disambiguate(hexnode, minlength):
                         """Disambiguate against wdirid."""
                         # Grow the prefix until it is no longer all 'f'.  If every
                         # prefix is all 'f' the loop ends and None is returned.
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if not maybewdir(prefix):
                                 return prefix

                     # Fast path through the index, only used when no revisions are
                     # filtered on this object.
                     if not getattr(self, 'filteredrevs', None):
                         try:
                             shortest = self.index.shortest(
                                 node
                             )  # pytype: disable=attribute-error
                             length = max(shortest, minlength)
                             return disambiguate(hexnode, length)
                         except error.RevlogError:
                             # A failure for wdirid is tolerated here and handled by
                             # the code below.
                             if node != self.nodeconstants.wdirid:
                                 raise error.LookupError(
                                     node, self.display_id, _(b'no node')
                                 )
                         except AttributeError:
                             # Fall through to pure code
                             pass
                     if node == self.nodeconstants.wdirid:
                         # For wdirid the first valid prefix is returned as is, without
                         # going through disambiguate().
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if isvalid(prefix):
                                 return prefix
                     # Pure path: the first valid prefix, then lengthened if needed so
                     # that it cannot be mistaken for wdir.
                     for length in range(minlength, len(hexnode) + 1):
                         prefix = hexnode[:length]
                         if isvalid(prefix):
                             return disambiguate(hexnode, length)
                 def cmp(self, node, text):
                     """Tell whether ``text`` differs from the stored revision ``node``.

                     The check is hash based: ``text`` is hashed together with the
                     parents of ``node`` and the result is compared to ``node``.
                     Returns True when they differ.
                     """
                     parent1, parent2 = self.parents(node)
                     expected = storageutil.hashrevisionsha1(text, parent1, parent2)
                     return expected != node
                 def deltaparent(self, rev):
                     """Return the revision that ``rev`` is stored as a delta against.

                     ``nullrev`` is returned when the index entry names ``rev`` itself
                     as its base. Otherwise the recorded base is returned when general
                     delta is enabled, and ``rev - 1`` when it is not.
                     """
                     base = self.index[rev][3]
                     if base == rev:
                         return nullrev
                     if self.delta_config.general_delta:
                         return base
                     return rev - 1
                 def issnapshot(self, rev):
                     """Tell whether ``rev`` is a snapshot.

                     The answer comes from the inner revlog. Once a call succeeded, the
                     inner implementation is bound on this instance so that later calls
                     bypass this wrapper.
                     """
                     answer = self._inner.issnapshot(rev)
                     # shadow this method with the inner one for subsequent calls
                     self.issnapshot = self._inner.issnapshot
                     return answer
                 def snapshotdepth(self, rev):
                     """Return the number of snapshots in the chain before ``rev``.

                     The value is the length of the delta chain of ``rev`` minus one.

                     Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
                     """
                     if not self.issnapshot(rev):
                         # interpolate the revision number: the message used to be
                         # raised with a literal, unformatted ``%d`` in it
                         raise error.ProgrammingError(
                             b'revision %d not a snapshot' % rev
                         )
                     return len(self._inner._deltachain(rev)[0]) - 1
                 def revdiff(self, rev1, rev2):
                     """Return a binary delta going from ``rev1`` to ``rev2``.

                     The delta is meant to be written to revlog data directly, so it is
                     computed on raw revision data. When ``rev2`` is already stored as
                     a delta against ``rev1``, the stored chunk is returned as is.
                     """
                     if rev1 != nullrev and self.deltaparent(rev2) == rev1:
                         stored_chunk = self._inner._chunk(rev2)
                         return bytes(stored_chunk)
                     differ = mdiff.textdiff
                     old_raw = self.rawdata(rev1)
                     new_raw = self.rawdata(rev2)
                     return differ(old_raw, new_raw)
                 def revision(self, nodeorrev):
                     """Return the uncompressed revision text.

                     ``nodeorrev`` is either a node or a revision number.
                     """
                     text = self._revisiondata(nodeorrev)
                     return text
                 def sidedata(self, nodeorrev):
                     """Return the sidedata attached to a revision.

                     Sidedata is a map of extra data related to the changeset that is
                     not part of the hash. A dictionary is returned for now; a more
                     advanced (lazier) mapping object may be used in the future.

                     ``nodeorrev`` is either a node or a revision number.
                     """
                     # an int is already a revision number, anything else is a node
                     rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
                     return self._sidedata(rev)
                 def _rawtext(self, node, rev):
                     """return the possibly unvalidated rawtext for a revision
                     returns (rev, rawtext, validated)
                     """
                     # Check if we have the entry in cache
                     # The cache entry looks like (node, rev, rawtext)
                     if self._inner._revisioncache:
                         if self._inner._revisioncache[0] == node:
                             return (rev, self._inner._revisioncache[2], True)
                     if rev is None:
                         rev = self.rev(node)
                     text = self._inner.raw_text(node, rev)
                     return (rev, text, False)
                 def _revisiondata(self, nodeorrev, raw=False):
                     # deal with <nodeorrev> argument type
                     if isinstance(nodeorrev, int):
                         rev = nodeorrev
                         node = self.node(rev)
                     else:
                         node = nodeorrev
                         rev = None
                     # fast path the special `nullid` rev
                     if node == self.nullid:
                         return b""
                     # ``rawtext`` is the text as stored inside the revlog. Might be the
                     # revision or might need to be processed to retrieve the revision.
                     rev, rawtext, validated = self._rawtext(node, rev)
                     if raw and validated:
                         # if we don't want to process the raw text and that raw
                         # text is cached, we can exit early.
                         return rawtext
                     if rev is None:
                         rev = self.rev(node)
                     # the revlog's flag for this revision
                     # (usually alter its state or content)
                     flags = self.flags(rev)
                     if validated and flags == REVIDX_DEFAULT_FLAGS:
                         # no extra flags set, no flag processor runs, text = rawtext
                         return rawtext
                     if raw:
                         validatehash = flagutil.processflagsraw(self, rawtext, flags)
                         text = rawtext
                     else:
                         r = flagutil.processflagsread(self, rawtext, flags)
                         text, validatehash = r
                     if validatehash:
                         self.checkhash(text, node, rev=rev)
                     if not validated:
                         self._inner._revisioncache = (node, rev, rawtext)
                     return text
                 def _sidedata(self, rev):
                     """Return the sidedata for a given revision number."""
                     if self._sidedatafile is None:
                         return {}
                     sidedata_end = None
                     if self._docket is not None:
                         sidedata_end = self._docket.sidedata_end
                     return self._inner.sidedata(rev, sidedata_end)
                 def rawdata(self, nodeorrev):
                     """Return the uncompressed raw data of a revision.

                     ``nodeorrev`` is either a node or a revision number.
                     """
                     raw_text = self._revisiondata(nodeorrev, raw=True)
                     return raw_text
                 def hash(self, text, p1, p2):
                     """Compute the node hash of ``text`` with parents ``p1`` and ``p2``.

                     This is a method so that subclasses can replace the hash as
                     needed.
                     """
                     digest = storageutil.hashrevisionsha1(text, p1, p2)
                     return digest
                 def checkhash(self, text, node, p1=None, p2=None, rev=None):
                     """Check that ``text`` hashes to ``node``.

                     The parents are looked up from ``node`` when neither ``p1`` nor
                     ``p2`` is given. ``rev``, when provided, is only used in the error
                     message.

                     Raises ``error.RevlogError`` on mismatch, or
                     ``error.CensoredNodeError`` when the revlog is censorable and
                     ``text`` is a censored text. This is a method so that subclasses
                     can extend hash mismatch behaviors as needed.
                     """
                     try:
                         if p1 is None and p2 is None:
                             p1, p2 = self.parents(node)
                         if node != self.hash(text, p1, p2):
                             # Drop the cached revision on hash failure. The cache only
                             # holds the raw revision, so the next raw access will miss
                             # the cache. This should be rare, and teaching the cache
                             # about the verification state would be extra work.
                             cached = self._inner._revisioncache
                             if cached and cached[0] == node:
                                 self._inner._revisioncache = None

                             if rev is not None:
                                 revornode = rev
                             else:
                                 revornode = templatefilters.short(hex(node))
                             msg = _(b"integrity check failed on %s:%s") % (
                                 self.display_id,
                                 pycompat.bytestr(revornode),
                             )
                             raise error.RevlogError(msg)
                     except error.RevlogError:
                         censored = (
                             self.feature_config.censorable
                             and storageutil.iscensoredtext(text)
                         )
                         if censored:
                             raise error.CensoredNodeError(self.display_id, node, text)
                         raise
                 @property
                 def _split_index_file(self):
                     """the path where to expect the index of an ongoing splitting operation
                     The file will only exist if a splitting operation is in progress, but
                     it is always expected at the same location."""
                     parts = self.radix.split(b'/')
                     if len(parts) > 1:
                         # adds a '-s' prefix to the ``data/` or `meta/` base
                         head = parts[0] + b'-s'
                         mids = parts[1:-1]
                         tail = parts[-1] + b'.i'
                         pieces = [head] + mids + [tail]
                         return b'/'.join(pieces)
                     else:
                         # the revlog is stored at the root of the store (changelog or
                         # manifest), no risk of collision.
                         return self.radix + b'.i.s'
                 def _enforceinlinesize(self, tr):
                     """Check if the revlog is too big for inline and convert if so.
                     This should be called after revisions are added to the revlog. If the
                     revlog has grown too large to be an inline revlog, it will convert it
                     to use multiple index and data files.
                     """
                     tiprev = len(self) - 1
                     total_size = self.start(tiprev) + self.length(tiprev)
                     if not self._inline or (self._may_inline and total_size < _maxinline):
                         return
                     if self._docket is not None:
                         msg = b"inline revlog should not have a docket"
                         raise error.ProgrammingError(msg)
                     # In the common case, we enforce inline size because the revlog has
                     # been appened too. And in such case, it must have an initial offset
                     # recorded in the transaction.
                     troffset = tr.findoffset(self._inner.canonical_index_file)
                     pre_touched = troffset is not None
                     if not pre_touched and self.target[0] != KIND_CHANGELOG:
                         raise error.RevlogError(
                             _(b"%s not found in the transaction") % self._indexfile
                         )
                     tr.addbackup(self._inner.canonical_index_file, for_offset=pre_touched)
                     tr.add(self._datafile, 0)
                     new_index_file_path = None
                     old_index_file_path = self._indexfile
                     new_index_file_path = self._split_index_file
                     opener = self.opener
                     weak_self = weakref.ref(self)
                     # the "split" index replace the real index when the transaction is
                     # finalized
                     def finalize_callback(tr):
                         opener.rename(
                             new_index_file_path,
                             old_index_file_path,
                             checkambig=True,
                         )
                         maybe_self = weak_self()
                         if maybe_self is not None:
                             maybe_self._indexfile = old_index_file_path
                             maybe_self._inner.index_file = maybe_self._indexfile
                     def abort_callback(tr):
                         maybe_self = weak_self()
                         if maybe_self is not None:
                             maybe_self._indexfile = old_index_file_path
                             maybe_self._inner.inline = True
                             maybe_self._inner.index_file = old_index_file_path
                     tr.registertmp(new_index_file_path)
                     # we use 001 here to make this this happens after the finalisation of
                     # pending changelog write (using 000). Otherwise the two finalizer
                     # would step over each other and delete the changelog.i file.
                     if self.target[1] is not None:
                         callback_id = b'001-revlog-split-%d-%s' % self.target
                     else:
                         callback_id = b'001-revlog-split-%d' % self.target[0]
                     tr.addfinalize(callback_id, finalize_callback)
                     tr.addabort(callback_id, abort_callback)
                     self._format_flags &= ~FLAG_INLINE_DATA
                     self._inner.split_inline(
                         tr,
                         self._format_flags | self._format_version,
                         new_index_file_path=new_index_file_path,
                     )
                     self._inline = False
                     if new_index_file_path is not None:
                         self._indexfile = new_index_file_path
                     nodemaputil.setup_persistent_nodemap(tr, self)
                 def _nodeduplicatecallback(self, transaction, node):
                     """Hook called when trying to add a node that is already stored.

                     This implementation does nothing with ``transaction`` or ``node``.
                     """
                 @contextlib.contextmanager
                 def reading(self):
                     """Context manager wrapping the inner revlog's ``reading`` context."""
                     inner_context = self._inner.reading()
                     with inner_context:
                         yield
                 @contextlib.contextmanager
                 def _writing(self, transaction):
                     if self._trypending:
                         msg = b'try to write in a `trypending` revlog: %s'
                         msg %= self.display_id
                         raise error.ProgrammingError(msg)
                     if self._inner.is_writing:
                         yield
                     else:
                         data_end = None
                         sidedata_end = None
                         if self._docket is not None:
                             data_end = self._docket.data_end
                             sidedata_end = self._docket.sidedata_end
                         with self._inner.writing(
                             transaction,
                             data_end=data_end,
                             sidedata_end=sidedata_end,
                         ):
                             yield
                             if self._docket is not None:
                                 self._write_docket(transaction)
                 @property
                 def is_delaying(self):
                     """The ``is_delaying`` value of the inner revlog."""
                     delaying = self._inner.is_delaying
                     return delaying
                 def _write_docket(self, transaction):
                     """write the current docket on disk
                     Exist as a method to help changelog to implement transaction logic
                     We could also imagine using the same transaction logic for all revlog
                     since docket are cheap."""
                     self._docket.write(transaction)
                 def addrevision(
                     self,
                     text,
                     transaction,
                     link,
                     p1,
                     p2,
                     cachedelta=None,
                     node=None,
                     flags=REVIDX_DEFAULT_FLAGS,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a revision to the log and return its revision number.

                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     cachedelta - an optional precomputed delta
                     node - nodeid of revision; typically node is not specified, and it is
                         computed by default as hash(text, p1, p2), however subclasses might
                         use different hashing method (and override checkhash() in such case)
                     flags - the known flags to set on the revision
                     deltacomputer - an optional deltacomputer instance shared between
                         multiple calls
                     sidedata - an optional mapping of sidedata; a non-empty one is
                         rejected when the revlog does not support sidedata

                     When the node is already stored, the existing revision number is
                     returned and nothing is written.
                     """
                     if link == nullrev:
                         msg = _(b"attempted to add linkrev -1 to %s") % self.display_id
                         raise error.RevlogError(msg)

                     if sidedata is None:
                         sidedata = {}
                     elif sidedata and not self.feature_config.has_side_data:
                         msg = _(b"trying to add sidedata to a revlog who don't support them")
                         raise error.ProgrammingError(msg)

                     if flags:
                         node = node or self.hash(text, p1, p2)

                     rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

                     # A flag processor that modified the revision data invalidates any
                     # provided cachedelta.
                     if rawtext != text:
                         cachedelta = None

                     rawsize = len(rawtext)
                     if rawsize > _maxentrysize:
                         msg = _(
                             b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                         )
                         raise error.RevlogError(msg % (self.display_id, rawsize))

                     node = node or self.hash(rawtext, p1, p2)
                     known_rev = self.index.get_rev(node)
                     if known_rev is not None:
                         return known_rev

                     if validatehash:
                         self.checkhash(rawtext, node, p1=p1, p2=p2)

                     return self.addrawrevision(
                         rawtext,
                         transaction,
                         link,
                         p1,
                         p2,
                         node,
                         flags,
                         cachedelta=cachedelta,
                         deltacomputer=deltacomputer,
                         sidedata=sidedata,
                     )
                 def addrawrevision(
                     self,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     node,
                     flags,
                     cachedelta=None,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a raw revision with known flags, node and parents.

                     Useful when reusing a revision not stored in this revlog (ex:
                     received over wire, or read from an external bundle). The write
                     happens inside a ``_writing`` context and the value returned by
                     ``_addrevision`` is passed back to the caller.
                     """
                     keywords = {
                         'deltacomputer': deltacomputer,
                         'sidedata': sidedata,
                     }
                     with self._writing(transaction):
                         return self._addrevision(
                             node,
                             rawtext,
                             transaction,
                             link,
                             p1,
                             p2,
                             flags,
                             cachedelta,
                             **keywords
                         )
                 def compress(self, data: bytes) -> Tuple[bytes, bytes]:
                     """Compress ``data`` with the inner revlog's ``compress``."""
                     compressed = self._inner.compress(data)
                     return compressed
                 def decompress(self, data):
                     """Decompress ``data`` with the inner revlog's ``decompress``."""
                     decompressed = self._inner.decompress(data)
                     return decompressed
                 def _addrevision(
                     self,
                     node,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     flags,
                     cachedelta,
                     alwayscache=False,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """internal function to add revisions to the log

                     see addrevision for argument descriptions.

                     note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

                     if "deltacomputer" is not provided or None, a defaultdeltacomputer will
                     be used.

                     if "alwayscache" is set and no rawtext is available after the delta
                     search, the text is rebuilt through the delta computer so that it can
                     be stored in the revision cache.

                     Returns the revision number of the added entry.

                     Raises error.RevlogError when ``node`` is the null id or a working
                     directory id, and error.ProgrammingError when called outside of a
                     `revlog._writing` context.

                     invariants:
                     - rawtext is optional (can be None); if not set, cachedelta must be set.
                       if both are set, they must correspond to each other.
                     """
                     if node == self.nullid:
                         raise error.RevlogError(
                             _(b"%s: attempt to add null revision") % self.display_id
                         )
                     if (
                         node == self.nodeconstants.wdirid
                         or node in self.nodeconstants.wdirfilenodeids
                     ):
                         raise error.RevlogError(
                             _(b"%s: attempt to add wdir revision") % self.display_id
                         )
                     if not self._inner.is_writing:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     # one-element list handed to the revision info below; it is read
                     # back after the write to feed the revision cache
                     btext = [rawtext]
                     # revision number of the entry being added
                     curr = len(self)
                     prev = curr - 1
                     offset = self._get_data_offset(prev)
                     if self._concurrencychecker:
                         ifh, dfh, sdfh = self._inner._writinghandles
                         # XXX no checking for the sidedata file
                         if self._inline:
                             # offset is "as if" it were in the .d file, so we need to add on
                             # the size of the entry metadata.
                             self._concurrencychecker(
                                 ifh, self._indexfile, offset + curr * self.index.entry_size
                             )
                         else:
                             # Entries in the .i are a consistent size.
                             self._concurrencychecker(
                                 ifh, self._indexfile, curr * self.index.entry_size
                             )
                             self._concurrencychecker(dfh, self._datafile, offset)
                     p1r, p2r = self.rev(p1), self.rev(p2)
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if rawtext is None:
                         # need rawtext size, before changed by flag processors, which is
                         # the non-raw size. use revlog explicitly to avoid filelog's extra
                         # logic that might remove metadata size.
                         textlen = mdiff.patchedsize(
                             revlog.size(self, cachedelta[0]), cachedelta[1]
                         )
                     else:
                         textlen = len(rawtext)
                     if deltacomputer is None:
                         # build a delta computer, with debug output wired to the
                         # transaction when delta debugging is enabled
                         write_debug = None
                         if self.delta_config.debug_delta:
                             write_debug = transaction._report
                         deltacomputer = deltautil.deltacomputer(
                             self, write_debug=write_debug
                         )
                     if cachedelta is not None and len(cachedelta) == 2:
                         # If the cached delta has no information about how it should be
                         # reused, add the default reuse instruction according to the
                         # revlog's configuration.
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse = DELTA_BASE_REUSE_NO
                         cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)
                     revinfo = revlogutils.revisioninfo(
                         node,
                         p1,
                         p2,
                         btext,
                         textlen,
                         cachedelta,
                         flags,
                     )
                     deltainfo = deltacomputer.finddeltainfo(revinfo)
                     # the compression mode is only refined when there is a docket
                     compression_mode = COMP_MODE_INLINE
                     if self._docket is not None:
                         default_comp = self._docket.default_compression_header
                         r = deltautil.delta_compression(default_comp, deltainfo)
                         compression_mode, deltainfo = r
                     sidedata_compression_mode = COMP_MODE_INLINE
                     if sidedata and self.feature_config.has_side_data:
                         sidedata_compression_mode = COMP_MODE_PLAIN
                         serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
                         sidedata_offset = self._docket.sidedata_end
                         h, comp_sidedata = self._inner.compress(serialized_sidedata)
                         # only keep the compressed form when it is actually smaller
                         if (
                             h != b'u'
                             and comp_sidedata[0:1] != b'\0'
                             and len(comp_sidedata) < len(serialized_sidedata)
                         ):
                             assert not h
                             if (
                                 comp_sidedata[0:1]
                                 == self._docket.default_compression_header
                             ):
                                 sidedata_compression_mode = COMP_MODE_DEFAULT
                                 serialized_sidedata = comp_sidedata
                             else:
                                 sidedata_compression_mode = COMP_MODE_INLINE
                                 serialized_sidedata = comp_sidedata
                     else:
                         serialized_sidedata = b""
                         # Don't store the offset if the sidedata is empty, that way
                         # we can easily detect empty sidedata and they will be no different
                         # than ones we manually add.
                         sidedata_offset = 0
                     rank = RANK_UNKNOWN
                     if self.feature_config.compute_rank:
                         if (p1r, p2r) == (nullrev, nullrev):
                             # no parent at all
                             rank = 1
                         elif p1r != nullrev and p2r == nullrev:
                             # single parent, stored as p1
                             rank = 1 + self.fast_rank(p1r)
                         elif p1r == nullrev and p2r != nullrev:
                             # single parent, stored as p2
                             rank = 1 + self.fast_rank(p2r)
                         else:  # merge node
                             if rustdagop is not None and self.index.rust_ext_compat:
                                 rank = rustdagop.rank(self.index, p1r, p2r)
                             else:
                                 # rank of the highest parent, plus the revisions
                                 # reported by findmissingrevs([pmax], [pmin])
                                 pmin, pmax = sorted((p1r, p2r))
                                 rank = 1 + self.fast_rank(pmax)
                                 rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))
                     e = revlogutils.entry(
                         flags=flags,
                         data_offset=offset,
                         data_compressed_length=deltainfo.deltalen,
                         data_uncompressed_length=textlen,
                         data_compression_mode=compression_mode,
                         data_delta_base=deltainfo.base,
                         link_rev=link,
                         parent_rev_1=p1r,
                         parent_rev_2=p2r,
                         node_id=node,
                         sidedata_offset=sidedata_offset,
                         sidedata_compressed_length=len(serialized_sidedata),
                         sidedata_compression_mode=sidedata_compression_mode,
                         rank=rank,
                     )
                     self.index.append(e)
                     entry = self.index.entry_binary(curr)
                     if curr == 0 and self._docket is None:
                         # first entry of a revlog without docket: the packed format
                         # header is prepended to the entry
                         header = self._format_flags | self._format_version
                         header = self.index.pack_header(header)
                         entry = header + entry
                     self._writeentry(
                         transaction,
                         entry,
                         deltainfo.data,
                         link,
                         offset,
                         serialized_sidedata,
                         sidedata_offset,
                     )
                     rawtext = btext[0]
                     if alwayscache and rawtext is None:
                         rawtext = deltacomputer.buildtext(revinfo)
                     if type(rawtext) == bytes:  # only accept immutable objects
                         self._inner._revisioncache = (node, curr, rawtext)
                     self._chainbasecache[curr] = deltainfo.chainbase
                     return curr
                 def _get_data_offset(self, prev):
                     """Returns the current offset in the (in-transaction) data file.
                     Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket
                     file to store that information: since sidedata can be rewritten to the
                     end of the data file within a transaction, you can have cases where, for
                     example, rev `n` does not have sidedata while rev `n - 1` does, leading
                     to `n - 1`'s sidedata being written after `n`'s data.
                     TODO cache this in a docket file before getting out of experimental."""
                     if self._docket is None:
                         return self.end(prev)
                     else:
                         return self._docket.data_end
                 def _writeentry(
                     self,
                     transaction,
                     entry,
                     data,
                     link,
                     offset,
                     sidedata,
                     sidedata_offset,
                 ):
                     """Write one index entry with its data and sidedata.

                     The write itself is done by the inner revlog. Afterwards the
                     inline size is enforced, the docket (if any) is updated with the
                     new file ends and the persistent nodemap is set up.
                     """
                     # Files opened in a+ mode have inconsistent behavior on various
                     # platforms. Windows requires that a file positioning call be made
                     # when the file handle transitions between reads and writes. See
                     # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
                     # platforms, Python or the platform itself can be buggy. Some versions
                     # of Solaris have been observed to not append at the end of the file
                     # if the file was seeked to before the end. See issue4943 for more.
                     #
                     # We work around this issue by inserting a seek() before writing.
                     # Note: This is likely not necessary on Python 3. However, because
                     # the file handle is reused for reads and may be seeked there, we need
                     # to be careful before changing this.
                     docket = self._docket
                     if docket is None:
                         index_end = data_end = sidedata_end = None
                     else:
                         index_end = docket.index_end
                         data_end = docket.data_end
                         sidedata_end = docket.sidedata_end

                     files_end = self._inner.write_entry(
                         transaction,
                         entry,
                         data,
                         link,
                         offset,
                         sidedata,
                         sidedata_offset,
                         index_end,
                         data_end,
                         sidedata_end,
                     )
                     self._enforceinlinesize(transaction)

                     # record the new (index, data, sidedata) file ends in the docket
                     docket = self._docket
                     if docket is not None:
                         docket.index_end = files_end[0]
                         docket.data_end = files_end[1]
                         docket.sidedata_end = files_end[2]

                     nodemaputil.setup_persistent_nodemap(transaction, self)
                 def addgroup(
                     self,
                     deltas,
                     linkmapper,
                     transaction,
                     alwayscache=False,
                     addrevisioncb=None,
                     duplicaterevisioncb=None,
                     debug_info=None,
                     delta_base_reuse_policy=None,
                 ):
                     """
                     add a delta group
                     given a set of deltas, add them to the revision log. the
                     first delta is against its parent, which should be in our
                     log, the rest are against the previous delta.
                     ``deltas`` yields 8-tuples of the form
                     ``(node, p1, p2, linknode, deltabase, delta, flags, sidedata)``.
                     ``linkmapper`` is called with each ``linknode`` and its result is
                     stored as the link revision.
                     If ``addrevisioncb`` is defined, it will be called with arguments of
                     this revlog and the revision returned by ``_addrevision()`` for the
                     entry that was just added.
                     If ``duplicaterevisioncb`` is defined, it will be called with this
                     revlog and the existing revision whenever a node of the group is
                     already stored.
                     ``alwayscache`` and ``debug_info`` are forwarded to
                     ``_addrevision()`` and to the delta computer respectively.
                     When ``delta_base_reuse_policy`` is None, it defaults to
                     ``DELTA_BASE_REUSE_TRY`` if both ``general_delta`` and
                     ``lazy_delta_base`` are enabled in the delta config, and to
                     ``DELTA_BASE_REUSE_NO`` otherwise.
                     Returns True if the group contained at least one delta (added or
                     duplicate), False if it was empty.
                     Raises ``error.ProgrammingError`` on nested calls,
                     ``error.LookupError`` for an unknown parent or delta base, and
                     ``error.CensoredBaseError`` when the delta base is censored and the
                     delta is not a full replacement.
                     """
                     if self._adding_group:
                         raise error.ProgrammingError(b'cannot nest addgroup() calls')
                     # read the default delta-base reuse policy from revlog config if the
                     # group did not specify one.
                     if delta_base_reuse_policy is None:
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse_policy = DELTA_BASE_REUSE_NO
                     self._adding_group = True
                     # stays True until at least one delta of the group has been seen
                     empty = True
                     try:
                         with self._writing(transaction):
                             write_debug = None
                             if self.delta_config.debug_delta:
                                 write_debug = transaction._report
                             deltacomputer = deltautil.deltacomputer(
                                 self,
                                 write_debug=write_debug,
                                 debug_info=debug_info,
                             )
                             # loop through our set of deltas
                             for data in deltas:
                                 (
                                     node,
                                     p1,
                                     p2,
                                     linknode,
                                     deltabase,
                                     delta,
                                     flags,
                                     sidedata,
                                 ) = data
                                 link = linkmapper(linknode)
                                 flags = flags or REVIDX_DEFAULT_FLAGS
                                 rev = self.index.get_rev(node)
                                 if rev is not None:
                                     # this can happen if two branches make the same change
                                     self._nodeduplicatecallback(transaction, rev)
                                     if duplicaterevisioncb:
                                         duplicaterevisioncb(self, rev)
                                     empty = False
                                     continue
                                 # both parents and the delta base must already be stored
                                 for p in (p1, p2):
                                     if not self.index.has_node(p):
                                         raise error.LookupError(
                                             p, self.radix, _(b'unknown parent')
                                         )
                                 if not self.index.has_node(deltabase):
                                     raise error.LookupError(
                                         deltabase, self.display_id, _(b'unknown delta base')
                                     )
                                 baserev = self.rev(deltabase)
                                 if baserev != nullrev and self.iscensored(baserev):
                                     # if base is censored, delta must be full replacement in a
                                     # single patch operation
                                     hlen = struct.calcsize(b">lll")
                                     oldlen = self.rawsize(baserev)
                                     newlen = len(delta) - hlen
                                     if delta[:hlen] != mdiff.replacediffheader(
                                         oldlen, newlen
                                     ):
                                         raise error.CensoredBaseError(
                                             self.display_id, self.node(baserev)
                                         )
                                 # only inspect the delta for censorship when no flag is set
                                 if not flags and self._peek_iscensored(baserev, delta):
                                     flags |= REVIDX_ISCENSORED
                                 # We assume consumers of addrevisioncb will want to retrieve
                                 # the added revision, which will require a call to
                                 # revision(). revision() will fast path if there is a cache
                                 # hit. So, we tell _addrevision() to always cache in this case.
                                 # We're only using addgroup() in the context of changegroup
                                 # generation so the revision data can always be handled as raw
                                 # by the flagprocessor.
                                 rev = self._addrevision(
                                     node,
                                     None,
                                     transaction,
                                     link,
                                     p1,
                                     p2,
                                     flags,
                                     (baserev, delta, delta_base_reuse_policy),
                                     alwayscache=alwayscache,
                                     deltacomputer=deltacomputer,
                                     sidedata=sidedata,
                                 )
                                 if addrevisioncb:
                                     addrevisioncb(self, rev)
                                 empty = False
                     finally:
                         # always release the re-entrancy guard, even on error
                         self._adding_group = False
                     return not empty
                 def iscensored(self, rev):
                     """Tell whether revision ``rev`` carries the censored flag.

                     Always False when the revlog is not censorable; otherwise the
                     result is the revision's flags masked with ``REVIDX_ISCENSORED``.
                     """
                     if self.feature_config.censorable:
                         return self.flags(rev) & REVIDX_ISCENSORED
                     return False
                 def _peek_iscensored(self, baserev, delta):
                     """Quickly check if a delta produces a censored revision."""
                     if not self.feature_config.censorable:
                         return False
                     return storageutil.deltaiscensored(delta, baserev, self.rawsize)
                 def getstrippoint(self, minlink):
                     """Find the minimum rev that must be stripped to strip ``minlink``.

                     Returns a tuple containing the minimum rev and a set of all revs
                     that have linkrevs that will be broken by this strip.
                     """
                     tiprev = len(self) - 1
                     heads = self.headrevs()
                     return storageutil.resolvestripinfo(
                         minlink, tiprev, heads, self.linkrev, self.parentrevs
                     )
                 def strip(self, minlink, transaction):
                     """Truncate the revlog at the first revision with linkrev >= minlink.

                     Called when revision ``minlink`` and its descendants are being
                     stripped from the repository. Every revision with a
                     linkrev >= minlink has to go, because the equivalent changelog
                     revisions will be renumbered after the strip.

                     The revlog is therefore cut at the first such revision; the caller
                     is trusted to have saved the revisions that should survive and to
                     re-add them after this truncation.
                     """
                     if not len(self):
                         return
                     striprev, _brokenrevs = self.getstrippoint(minlink)
                     if striprev == len(self):
                         # nothing at or after the strip point
                         return
                     # first truncate the files on disk
                     data_end = self.start(striprev)
                     index_end = striprev * self.index.entry_size
                     if self._inline:
                         # for inline revlogs the index file cut point also accounts
                         # for the data bytes preceding the stripped revision
                         index_end += data_end
                     else:
                         transaction.add(self._datafile, data_end)
                     if self._sidedatafile:
                         sidedata_end = self.sidedata_cut_off(striprev)
                         transaction.add(self._sidedatafile, sidedata_end)
                     transaction.add(self._indexfile, index_end)
                     docket = self._docket
                     if docket is not None:
                         # XXX we could, leverage the docket while stripping. However it is
                         # not powerfull enough at the time of this comment
                         docket.index_end = index_end
                         docket.data_end = data_end
                         docket.sidedata_end = sidedata_end
                         docket.write(transaction, stripping=True)
                     # then reset internal state in memory to forget those revisions
                     self._chaininfocache = util.lrucachedict(500)
                     self._inner.clear_cache()
                     del self.index[striprev:-1]
                 def checksize(self):
                     """Check size of index and data files

                     return a (dd, di) tuple.
                     - dd: extra bytes for the "data" file
                     - di: extra bytes for the "index" file

                     A healthy revlog will return (0, 0). A missing data or index file
                     is reported as 0 extra bytes for that file.
                     """
                     expected = 0
                     if len(self):
                         expected = max(0, self.end(len(self) - 1))
                     try:
                         with self._datafp() as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         dd = actual - expected
                     except FileNotFoundError:
                         dd = 0
                     try:
                         # Use a context manager so the index handle is released even
                         # when seek()/tell() raise, instead of relying on a manual
                         # close() that would be skipped on error.
                         with self.opener(self._indexfile) as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         s = self.index.entry_size
                         # bytes left over after the last complete index entry
                         i = max(0, actual // s)
                         di = actual - (i * s)
                         if self._inline:
                             # inline revlogs keep revision data in the index file, so
                             # the data bytes are accounted for there and dd is reset
                             databytes = 0
                             for r in self:
                                 databytes += max(0, self.length(r))
                             dd = 0
                             di = actual - len(self) * s - databytes
                     except FileNotFoundError:
                         di = 0
                     return (dd, di)
                 def files(self):
                     """List the files that make up this revlog.

                     The index file always comes first. Without a docket file, the data
                     file follows unless the revlog is inline. With a docket file, the
                     docket, the old index/data/sidedata files it reports, and the
                     current data and sidedata files (when their recorded end offset is
                     non-zero) are listed.
                     """
                     paths = [self._indexfile]
                     if self._docket_file is None:
                         if not self._inline:
                             paths.append(self._datafile)
                         return paths
                     docket = self._docket
                     paths.append(self._docket_file)
                     paths.extend(docket.old_index_filepaths(include_empty=False))
                     if docket.data_end:
                         paths.append(self._datafile)
                     paths.extend(docket.old_data_filepaths(include_empty=False))
                     if docket.sidedata_end:
                         paths.append(self._sidedatafile)
                     paths.extend(docket.old_sidedata_filepaths(include_empty=False))
                     return paths
                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                     sidedata_helpers=None,
                     debug_info=None,
                 ):
                     """Emit revision deltas for ``nodes`` via ``storageutil.emitrevisions``.

                     ``nodesorder`` must be one of ``b'nodes'``, ``b'storage'``,
                     ``b'linear'`` or None; anything else raises
                     ``error.ProgrammingError``. When it is None and general delta is
                     disabled, storage order is used. When delta chains are not stored,
                     any delta mode other than ``CG_DELTAMODE_PREV`` is replaced by
                     ``CG_DELTAMODE_FULL``.
                     """
                     accepted_orders = (b'nodes', b'storage', b'linear', None)
                     if nodesorder not in accepted_orders:
                         raise error.ProgrammingError(
                             b'unhandled value for nodesorder: %s' % nodesorder
                         )
                     if nodesorder is None:
                         if not self.delta_config.general_delta:
                             nodesorder = b'storage'
                     if not self._storedeltachains:
                         if deltamode != repository.CG_DELTAMODE_PREV:
                             deltamode = repository.CG_DELTAMODE_FULL
                     return storageutil.emitrevisions(
                         self,
                         nodes,
                         nodesorder,
                         revlogrevisiondelta,
                         deltaparentfn=self.deltaparent,
                         candeltafn=self._candelta,
                         rawsizefn=self.rawsize,
                         revdifffn=self.revdiff,
                         flagsfn=self.flags,
                         deltamode=deltamode,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         sidedata_helpers=sidedata_helpers,
                         debug_info=debug_info,
                     )
                 # Accepted values for the ``deltareuse`` argument of ``clone()``.
                 DELTAREUSEALWAYS = b'always'
                 DELTAREUSESAMEREVS = b'samerevs'
                 DELTAREUSENEVER = b'never'
                 DELTAREUSEFULLADD = b'fulladd'
                 # The complete set of valid policies, used to validate the argument.
                 DELTAREUSEALL = {
                     DELTAREUSEALWAYS,
                     DELTAREUSESAMEREVS,
                     DELTAREUSENEVER,
                     DELTAREUSEFULLADD,
                 }
                 def clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb=None,
                     deltareuse=DELTAREUSESAMEREVS,
                     forcedeltabothparents=None,
                     sidedata_helpers=None,
                 ):
                     """Copy this revlog to another, possibly with format changes.

                     The destination revlog will contain the same revisions and nodes.
                     However, it may not be bit-for-bit identical due to e.g. delta
                     encoding differences.

                     The ``deltareuse`` argument controls how deltas from the existing
                     revlog are preserved in the destination revlog. The argument can
                     have the following values:

                     DELTAREUSEALWAYS
                        Deltas will always be reused (if possible), even if the
                        destination revlog would not select the same revisions for the
                        delta. This is the fastest mode of operation.
                     DELTAREUSESAMEREVS
                        Deltas will be reused if the destination revlog would pick the
                        same revisions for the delta. This mode strikes a balance
                        between speed and optimization.
                     DELTAREUSENEVER
                        Deltas will never be reused. This is the slowest mode of
                        execution. This mode can be used to recompute deltas (e.g. if
                        the diff/delta algorithm changes).
                     DELTAREUSEFULLADD
                        Revisions will be re-added as if they were new content. This is
                        slower than DELTAREUSEALWAYS but allows more mechanisms to kick
                        in, e.g. large file detection and handling.

                     Delta computation can be slow, so the choice of delta reuse policy
                     can significantly affect run time.

                     The default policy (``DELTAREUSESAMEREVS``) strikes a balance
                     between two extremes. Deltas will be reused if they are
                     appropriate. But if the delta could choose a better revision, it
                     will do so. This means if you are converting a non-generaldelta
                     revlog to a generaldelta revlog, deltas will be recomputed if the
                     delta's parent isn't a parent of the revision.

                     In addition to the delta policy, the ``forcedeltabothparents``
                     argument controls whether to force compute deltas against both
                     parents for merges. By default, the current default is used.

                     See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
                     `sidedata_helpers`.

                     Raises ``ValueError`` for an unknown ``deltareuse`` value, a
                     non-empty destination, or filtered revisions on either side.
                     """
                     if deltareuse not in self.DELTAREUSEALL:
                         raise ValueError(
                             _(b'value for deltareuse invalid: %s') % deltareuse
                         )
                     if len(destrevlog):
                         raise ValueError(_(b'destination revlog is not empty'))
                     if getattr(self, 'filteredrevs', None):
                         raise ValueError(_(b'source revlog has filtered revisions'))
                     if getattr(destrevlog, 'filteredrevs', None):
                         raise ValueError(_(b'destination revlog has filtered revisions'))
                     # lazydelta and lazydeltabase controls whether to reuse a cached delta,
                     # if possible. Work on a copy of the destination's delta config so
                     # the original can be restored once the clone is done.
                     saved_config = destrevlog.delta_config
                     destrevlog.delta_config = destrevlog.delta_config.copy()
                     try:
                         # policy -> (lazy_delta_base, lazy_delta); DELTAREUSEFULLADD
                         # is deliberately absent and leaves both settings untouched
                         lazy_settings = {
                             self.DELTAREUSEALWAYS: (True, True),
                             self.DELTAREUSESAMEREVS: (False, True),
                             self.DELTAREUSENEVER: (False, False),
                         }
                         working_config = destrevlog.delta_config
                         chosen = lazy_settings.get(deltareuse)
                         if chosen is not None:
                             (
                                 working_config.lazy_delta_base,
                                 working_config.lazy_delta,
                             ) = chosen
                         working_config.delta_both_parents = (
                             forcedeltabothparents or saved_config.delta_both_parents
                         )
                         with self.reading(), destrevlog._writing(tr):
                             self._clone(
                                 tr,
                                 destrevlog,
                                 addrevisioncb,
                                 deltareuse,
                                 forcedeltabothparents,
                                 sidedata_helpers,
                             )
                     finally:
                         destrevlog.delta_config = saved_config
                 def _clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb,
                     deltareuse,
                     forcedeltabothparents,
                     sidedata_helpers,
                 ):
                     """perform the core duty of `revlog.clone` after parameter processing

                     Every revision of this revlog is copied, in order, into
                     ``destrevlog``. With ``DELTAREUSEFULLADD`` the revision is re-added
                     through ``destrevlog.addrevision()``; otherwise it goes through
                     ``destrevlog._addrevision()``, reusing the stored delta when the
                     destination's ``lazy_delta`` setting is on and the revision has a
                     delta parent.
                     When ``sidedata_helpers`` is given, it is run on each revision's
                     sidedata and the flags it returns are merged into the revision
                     flags. ``addrevisioncb``, if set, is called with
                     ``(self, rev, node)`` after each revision is copied.
                     ``forcedeltabothparents`` is not used in this method.
                     """
                     write_debug = None
                     if self.delta_config.debug_delta:
                         write_debug = tr._report
                     deltacomputer = deltautil.deltacomputer(
                         destrevlog,
                         write_debug=write_debug,
                     )
                     index = self.index
                     for rev in self:
                         entry = index[rev]
                         # Some classes override linkrev to take filtered revs into
                         # account. Use raw entry from index.
                         flags = entry[0] & 0xFFFF
                         linkrev = entry[4]
                         # entry[5] / entry[6] are used as parent revisions here; slot 7
                         # of an index entry is the node
                         p1 = index[entry[5]][7]
                         p2 = index[entry[6]][7]
                         node = entry[7]
                         # (Possibly) reuse the delta from the revlog if allowed and
                         # the revlog chunk is a delta.
                         cachedelta = None
                         rawtext = None
                         if deltareuse == self.DELTAREUSEFULLADD:
                             text = self._revisiondata(rev)
                             sidedata = self.sidedata(rev)
                             if sidedata_helpers is not None:
                                 (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # NOTE(review): `&` binds tighter than `|`, so this is
                                 # flags | (new_flags[0] & ~new_flags[1]) -- confirm
                                 # that this is the intended combination
                                 flags = flags | new_flags[0] & ~new_flags[1]
                             destrevlog.addrevision(
                                 text,
                                 tr,
                                 linkrev,
                                 p1,
                                 p2,
                                 cachedelta=cachedelta,
                                 node=node,
                                 flags=flags,
                                 deltacomputer=deltacomputer,
                                 sidedata=sidedata,
                             )
                         else:
                             if destrevlog.delta_config.lazy_delta:
                                 dp = self.deltaparent(rev)
                                 if dp != nullrev:
                                     cachedelta = (dp, bytes(self._inner._chunk(rev)))
                             sidedata = None
                             if not cachedelta:
                                 # no reusable delta: fall back to the full raw text
                                 try:
                                     rawtext = self._revisiondata(rev)
                                 except error.CensoredNodeError as censored:
                                     assert flags & REVIDX_ISCENSORED
                                     rawtext = censored.tombstone
                                 sidedata = self.sidedata(rev)
                             if sidedata is None:
                                 sidedata = self.sidedata(rev)
                             if sidedata_helpers is not None:
                                 (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # NOTE(review): same precedence remark as in the
                                 # DELTAREUSEFULLADD branch of this loop
                                 flags = flags | new_flags[0] & ~new_flags[1]
                             destrevlog._addrevision(
                                 node,
                                 rawtext,
                                 tr,
                                 linkrev,
                                 p1,
                                 p2,
                                 flags,
                                 cachedelta,
                                 deltacomputer=deltacomputer,
                                 sidedata=sidedata,
                             )
                         if addrevisioncb:
                             addrevisioncb(self, rev, node)
                 def censorrevision(self, tr, censor_nodes, tombstone=b''):
                     """Censor ``censor_nodes``, dispatching on the revlog format version.

                     Version 0 revlogs cannot be censored and raise
                     ``error.RevlogError``. Version 1 revlogs use ``rewrite.v1_censor``;
                     every other version uses ``rewrite.v2_censor``.
                     """
                     if self._format_version == REVLOGV0:
                         raise error.RevlogError(
                             _(b'cannot censor with version %d revlogs')
                             % self._format_version
                         )
                     if self._format_version == REVLOGV1:
                         censor = rewrite.v1_censor
                     else:
                         censor = rewrite.v2_censor
                     censor(self, tr, censor_nodes, tombstone)
                 def verifyintegrity(self, state) -> Iterable[repository.iverifyproblem]:
                     """Verifies the integrity of the revlog.
                     Yields ``revlogproblem`` instances describing problems that are
                     found.
                     ``state`` is a dict shared with the verifier. This method reads its
                     ``b'expectedversion'``, ``b'erroroncensored'`` and optional
                     ``b'skipflags'`` entries, and (re)initialises ``b'skipread'`` and
                     ``b'safe_renamed'`` to empty sets; nodes whose content could not be
                     read are added to ``b'skipread'``.
                     """
                     # file-size level checks first
                     dd, di = self.checksize()
                     if dd:
                         yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
                     if di:
                         yield revlogproblem(error=_(b'index contains %d extra bytes') % di)
                     version = self._format_version
                     # The verifier tells us what version revlog we should be.
                     if version != state[b'expectedversion']:
                         yield revlogproblem(
                             warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                             % (self.display_id, version, state[b'expectedversion'])
                         )
                     state[b'skipread'] = set()
                     state[b'safe_renamed'] = set()
                     for rev in self:
                         node = self.node(rev)
                         # Verify contents. 4 cases to care about:
                         #
                         #   common: the most common case
                         #   rename: with a rename
                         #   meta: file content starts with b'\1\n', the metadata
                         #         header defined in filelog.py, but without a rename
                         #   ext: content stored externally
                         #
                         # More formally, their differences are shown below:
                         #
                         #                       | common | rename | meta  | ext
                         #  -------------------------------------------------------
                         #   flags()             | 0      | 0      | 0     | not 0
                         #   renamed()           | False  | True   | False | ?
                         #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
                         #
                         # "rawtext" means the raw text stored in revlog data, which
                         # could be retrieved by "rawdata(rev)". "text"
                         # mentioned below is "revision(rev)".
                         #
                         # There are 3 different lengths stored physically:
                         #  1. L1: rawsize, stored in revlog index
                         #  2. L2: len(rawtext), stored in revlog data
                         #  3. L3: len(text), stored in revlog data if flags==0, or
                         #     possibly somewhere else if flags!=0
                         #
                         # L1 should be equal to L2. L3 could be different from them.
                         # "text" may or may not affect commit hash depending on flag
                         # processors (see flagutil.addflagprocessor).
                         #
                         #              | common  | rename | meta  | ext
                         # -------------------------------------------------
                         #    rawsize() | L1      | L1     | L1    | L1
                         #       size() | L1      | L2-LM  | L1(*) | L1 (?)
                         # len(rawtext) | L2      | L2     | L2    | L2
                         #    len(text) | L2      | L2     | L2    | L3
                         #  len(read()) | L2      | L2-LM  | L2-LM | L3 (?)
                         #
                         # LM:  length of metadata, depending on rawtext
                         # (*): not ideal, see comment in filelog.size
                         # (?): could be "- len(meta)" if the resolved content has
                         #      rename metadata
                         #
                         # Checks needed to be done:
                         #  1. length check: L1 == L2, in all cases.
                         #  2. hash check: depending on flag processor, we may need to
                         #     use either "text" (external), or "rawtext" (in revlog).
                         try:
                             # keep only the skip flags that this revision actually has
                             skipflags = state.get(b'skipflags', 0)
                             if skipflags:
                                 skipflags &= self.flags(rev)
                             _verify_revision(self, skipflags, state, node)
                             l1 = self.rawsize(rev)
                             l2 = len(self.rawdata(node))
                             if l1 != l2:
                                 yield revlogproblem(
                                     error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                                     node=node,
                                 )
                         except error.CensoredNodeError:
                             # censored data is only reported when the verifier asks
                             if state[b'erroroncensored']:
                                 yield revlogproblem(
                                     error=_(b'censored file data'), node=node
                                 )
                                 state[b'skipread'].add(node)
                         except Exception as e:
                             # any other failure is reported as a problem for this node
                             # rather than aborting the whole verification
                             yield revlogproblem(
                                 error=_(b'unpacking %s: %s')
                                 % (short(node), stringutil.forcebytestr(e)),
                                 node=node,
                             )
                             state[b'skipread'].add(node)
                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     """Return a dict of storage details, one key per requested item.

                     Each keyword argument enables the byte-string key of the same name:
                     ``exclusivefiles`` lists ``(opener, path)`` pairs for the index
                     file and, unless inline, the data file; ``sharedfiles`` is always
                     an empty list; ``revisionscount`` is ``len(self)``;
                     ``trackedsize`` sums ``rawsize()`` over all revisions; and
                     ``storedsize`` sums the on-disk size of every path in ``files()``.
                     """
                     info = {}
                     if exclusivefiles:
                         owned = [(self.opener, self._indexfile)]
                         if not self._inline:
                             owned.append((self.opener, self._datafile))
                         info[b'exclusivefiles'] = owned
                     if sharedfiles:
                         info[b'sharedfiles'] = []
                     if revisionscount:
                         info[b'revisionscount'] = len(self)
                     if trackedsize:
                         info[b'trackedsize'] = sum(self.rawsize(r) for r in self)
                     if storedsize:
                         on_disk = 0
                         for path in self.files():
                             on_disk += self.opener.stat(path).st_size
                         info[b'storedsize'] = on_disk
                     return info
                 def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
                     """Generate sidedata for revisions ``startrev``..``endrev`` (inclusive).

                     For every revision in the range the sidedata helpers are run, the
                     result is serialized (and stored compressed when that is smaller),
                     written through the sidedata write handle, and the revision's index
                     entry is updated in memory and rewritten in the index file.

                     Returns ``None`` without doing anything when the revlog has no
                     sidedata support, or when both ``helpers[1]`` and ``helpers[2]``
                     are empty.

                     Raises ``error.Abort`` when a revision in the range already has
                     sidedata recorded in its index entry.
                     """
                     if not self.feature_config.has_side_data:
                         return
                     # revlog formats with sidedata support do not support inline
                     assert not self._inline
                     if not helpers[1] and not helpers[2]:
                         # Nothing to generate or remove
                         return
                     new_entries = []
                     # append the new sidedata
                     with self._writing(transaction):
                         ifh, dfh, sdfh = self._inner._writinghandles
                         # NOTE(review): this seeks the *data* handle to the sidedata
                         # end, while the write offset below is read from the sidedata
                         # handle. It looks like `sdfh.seek(...)` was intended --
                         # confirm before changing.
                         dfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                         current_offset = sdfh.tell()
                         for rev in range(startrev, endrev + 1):
                             entry = self.index[rev]
                             new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                                 store=self,
                                 sidedata_helpers=helpers,
                                 sidedata={},
                                 rev=rev,
                             )
                             serialized_sidedata = sidedatautil.serialize_sidedata(
                                 new_sidedata
                             )
                             sidedata_compression_mode = COMP_MODE_INLINE
                             if serialized_sidedata and self.feature_config.has_side_data:
                                 sidedata_compression_mode = COMP_MODE_PLAIN
                                 h, comp_sidedata = self._inner.compress(serialized_sidedata)
                                 # Compare one-byte *slices*: indexing a bytes object
                                 # yields an int on Python 3, which never equals a bytes
                                 # value, so `comp_sidedata[0]` made the first test
                                 # always true and the default-header test always false.
                                 # (presumably `default_compression_header` is a one-byte
                                 # bytes value -- confirm against the docket definition)
                                 if (
                                     h != b'u'
                                     and comp_sidedata[0:1] != b'\0'
                                     and len(comp_sidedata) < len(serialized_sidedata)
                                 ):
                                     assert not h
                                     if (
                                         comp_sidedata[0:1]
                                         == self._docket.default_compression_header
                                     ):
                                         sidedata_compression_mode = COMP_MODE_DEFAULT
                                         serialized_sidedata = comp_sidedata
                                     else:
                                         sidedata_compression_mode = COMP_MODE_INLINE
                                         serialized_sidedata = comp_sidedata
                             if entry[8] != 0 or entry[9] != 0:
                                 # rewriting entries that already have sidedata is not
                                 # supported yet, because it introduces garbage data in the
                                 # revlog.
                                 msg = b"rewriting existing sidedata is not supported yet"
                                 raise error.Abort(msg)
                             # Apply (potential) flags to add and to remove after running
                             # the sidedata helpers. The parentheses matter: `&` binds
                             # tighter than `|`, so without them the flags to remove
                             # would only be masked out of the flags to add and never
                             # cleared from the existing entry.
                             new_offset_flags = (entry[0] | flags[0]) & ~flags[1]
                             entry_update = (
                                 current_offset,
                                 len(serialized_sidedata),
                                 new_offset_flags,
                                 sidedata_compression_mode,
                             )
                             # the sidedata computation might have moved the file cursors
                             # around
                             sdfh.seek(current_offset, os.SEEK_SET)
                             sdfh.write(serialized_sidedata)
                             new_entries.append(entry_update)
                             current_offset += len(serialized_sidedata)
                             self._docket.sidedata_end = sdfh.tell()
                         # rewrite the new index entries
                         ifh.seek(startrev * self.index.entry_size)
                         for i, e in enumerate(new_entries):
                             rev = startrev + i
                             self.index.replace_sidedata_info(
                                 rev, *e
                             )  # pytype: disable=attribute-error
                             packed = self.index.entry_binary(rev)
                             if rev == 0 and self._docket is None:
                                 # the first entry of a docket-less index also carries
                                 # the format header
                                 header = self._format_flags | self._format_version
                                 header = self.index.pack_header(header)
                                 packed = header + packed
                             ifh.write(packed)