upstream/mercurial-mirror Commit - r52210:5b3b6db4

1

# revlog.py - storage back-end for mercurial

1

# revlog.py - storage back-end for mercurial

2

# coding: utf8

2

# coding: utf8

3

#

3

#

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

"""Storage back-end for Mercurial.

9

"""Storage back-end for Mercurial.

10

11

This provides efficient delta storage with O(1) retrieve and append

11

This provides efficient delta storage with O(1) retrieve and append

12

and O(changes) merge between branches.

12

and O(changes) merge between branches.

13

"""

13

"""

14

15

16

import binascii

16

import binascii

17

import collections

17

import collections

18

import contextlib

18

import contextlib

19

import functools

19

import functools

20

import io

20

import io

21

import os

21

import os

22

import struct

22

import struct

23

import weakref

23

import weakref

24

import zlib

24

import zlib

25

26

# import stuff from node for others to import from revlog

26

# import stuff from node for others to import from revlog

27

from .node import (

27

from .node import (

28

bin,

28

bin,

29

hex,

29

hex,

30

nullrev,

30

nullrev,

31

sha1nodeconstants,

31

sha1nodeconstants,

32

short,

32

short,

33

wdirrev,

33

wdirrev,

34

)

34

)

35

from .i18n import _

35

from .i18n import _

36

from .revlogutils.constants import (

36

from .revlogutils.constants import (

37

ALL_KINDS,

37

ALL_KINDS,

38

CHANGELOGV2,

38

CHANGELOGV2,

39

COMP_MODE_DEFAULT,

39

COMP_MODE_DEFAULT,

40

COMP_MODE_INLINE,

40

COMP_MODE_INLINE,

41

COMP_MODE_PLAIN,

41

COMP_MODE_PLAIN,

42

DELTA_BASE_REUSE_NO,

42

DELTA_BASE_REUSE_NO,

43

DELTA_BASE_REUSE_TRY,

43

DELTA_BASE_REUSE_TRY,

44

ENTRY_RANK,

44

ENTRY_RANK,

45

FEATURES_BY_VERSION,

45

FEATURES_BY_VERSION,

46

FLAG_GENERALDELTA,

46

FLAG_GENERALDELTA,

47

FLAG_INLINE_DATA,

47

FLAG_INLINE_DATA,

48

INDEX_HEADER,

48

INDEX_HEADER,

49

KIND_CHANGELOG,

49

KIND_CHANGELOG,

50

KIND_FILELOG,

50

KIND_FILELOG,

51

RANK_UNKNOWN,

51

RANK_UNKNOWN,

52

REVLOGV0,

52

REVLOGV0,

53

REVLOGV1,

53

REVLOGV1,

54

REVLOGV1_FLAGS,

54

REVLOGV1_FLAGS,

55

REVLOGV2,

55

REVLOGV2,

56

REVLOGV2_FLAGS,

56

REVLOGV2_FLAGS,

57

REVLOG_DEFAULT_FLAGS,

57

REVLOG_DEFAULT_FLAGS,

58

REVLOG_DEFAULT_FORMAT,

58

REVLOG_DEFAULT_FORMAT,

59

REVLOG_DEFAULT_VERSION,

59

REVLOG_DEFAULT_VERSION,

60

SUPPORTED_FLAGS,

60

SUPPORTED_FLAGS,

61

)

61

)

62

from .revlogutils.flagutil import (

62

from .revlogutils.flagutil import (

63

REVIDX_DEFAULT_FLAGS,

63

REVIDX_DEFAULT_FLAGS,

64

REVIDX_ELLIPSIS,

64

REVIDX_ELLIPSIS,

65

REVIDX_EXTSTORED,

65

REVIDX_EXTSTORED,

66

REVIDX_FLAGS_ORDER,

66

REVIDX_FLAGS_ORDER,

67

REVIDX_HASCOPIESINFO,

67

REVIDX_HASCOPIESINFO,

68

REVIDX_ISCENSORED,

68

REVIDX_ISCENSORED,

69

REVIDX_RAWTEXT_CHANGING_FLAGS,

69

REVIDX_RAWTEXT_CHANGING_FLAGS,

70

)

70

)

71

from .thirdparty import attr

71

from .thirdparty import attr

72

from . import (

72

from . import (

73

ancestor,

73

ancestor,

74

dagop,

74

dagop,

75

error,

75

error,

76

mdiff,

76

mdiff,

77

policy,

77

policy,

78

pycompat,

78

pycompat,

79

revlogutils,

79

revlogutils,

80

templatefilters,

80

templatefilters,

81

util,

81

util,

82

)

82

)

83

from .interfaces import (

83

from .interfaces import (

84

repository,

84

repository,

85

util as interfaceutil,

85

util as interfaceutil,

86

)

86

)

87

from .revlogutils import (

87

from .revlogutils import (

88

deltas as deltautil,

88

deltas as deltautil,

89

docket as docketutil,

89

docket as docketutil,

90

flagutil,

90

flagutil,

91

nodemap as nodemaputil,

91

nodemap as nodemaputil,

92

randomaccessfile,

92

randomaccessfile,

93

revlogv0,

93

revlogv0,

94

rewrite,

94

rewrite,

95

sidedata as sidedatautil,

95

sidedata as sidedatautil,

96

)

96

)

97

from .utils import (

97

from .utils import (

98

storageutil,

98

storageutil,

99

stringutil,

99

stringutil,

100

)

100

)

101

102

# bare references to all these names, to keep pyflakes from complaining

102

# bare references to all these names, to keep pyflakes from complaining

103

# We need these names available in the module for extensions.

103

# We need these names available in the module for extensions.

104

105

REVLOGV0

105

REVLOGV0

106

REVLOGV1

106

REVLOGV1

107

REVLOGV2

107

REVLOGV2

108

CHANGELOGV2

108

CHANGELOGV2

109

FLAG_INLINE_DATA

109

FLAG_INLINE_DATA

110

FLAG_GENERALDELTA

110

FLAG_GENERALDELTA

111

REVLOG_DEFAULT_FLAGS

111

REVLOG_DEFAULT_FLAGS

112

REVLOG_DEFAULT_FORMAT

112

REVLOG_DEFAULT_FORMAT

113

REVLOG_DEFAULT_VERSION

113

REVLOG_DEFAULT_VERSION

114

REVLOGV1_FLAGS

114

REVLOGV1_FLAGS

115

REVLOGV2_FLAGS

115

REVLOGV2_FLAGS

116

REVIDX_ISCENSORED

116

REVIDX_ISCENSORED

117

REVIDX_ELLIPSIS

117

REVIDX_ELLIPSIS

118

REVIDX_HASCOPIESINFO

118

REVIDX_HASCOPIESINFO

119

REVIDX_EXTSTORED

119

REVIDX_EXTSTORED

120

REVIDX_DEFAULT_FLAGS

120

REVIDX_DEFAULT_FLAGS

121

REVIDX_FLAGS_ORDER

121

REVIDX_FLAGS_ORDER

122

REVIDX_RAWTEXT_CHANGING_FLAGS

122

REVIDX_RAWTEXT_CHANGING_FLAGS

123

124

parsers = policy.importmod('parsers')

124

parsers = policy.importmod('parsers')

125

rustancestor = policy.importrust('ancestor')

125

rustancestor = policy.importrust('ancestor')

126

rustdagop = policy.importrust('dagop')

126

rustdagop = policy.importrust('dagop')

127

rustrevlog = policy.importrust('revlog')

127

rustrevlog = policy.importrust('revlog')

128

129

# Module-level alias of ``zlib.decompress`` (aliased for performance).
_zlibdecompress = zlib.decompress

# max size of inline data embedded into a revlog (128 KiB)
_maxinline = 128 * 1024

134

135

# Flag processors for REVIDX_ELLIPSIS.

135

# Flag processors for REVIDX_ELLIPSIS.

136

def ellipsisreadprocessor(rl, text):
    """Read-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is accepted but not used.  The text is handed back untouched,
    paired with ``False``.
    """
    outcome = (text, False)
    return outcome

138

139

140

def ellipsiswriteprocessor(rl, text):
    """Write-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is accepted but not used.  The text is handed back untouched,
    paired with ``False``.
    """
    outcome = (text, False)
    return outcome

142

143

144

def ellipsisrawprocessor(rl, text):
    """Raw flag processor for REVIDX_ELLIPSIS.

    Both arguments are ignored; the answer is always ``False``.
    """
    answer = False
    return answer

146

147

148

# The three REVIDX_ELLIPSIS processors bundled as (read, write, raw).
ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)

153

154

155

def _verify_revision(rl, skipflags, state, node):
    """Check the integrity of one revlog ``node``, or record it as skipped.

    This lives in its own function so that extensions have a hook point to
    influence the operation.

    When ``skipflags`` is truthy, ``node`` is added to
    ``state[b'skipread']`` and nothing is read.  Otherwise
    ``rl.revision(node)`` is called and its result discarded.
    """
    if not skipflags:
        # Called only for its side effect: read content and verify hash.
        rl.revision(node)
        return
    state[b'skipread'].add(node)

163

164

165

# True if a fast implementation for persistent-nodemap is available
#
# The "pure" python implementation is also counted as "fast": people using
# pure don't really have performance considerations (and they have a
# wheelbarrow of other sources of slowness).
HAS_FAST_PERSISTENT_NODEMAP = (
    hasattr(parsers, 'BaseIndexObject') or rustrevlog is not None
)

173

174

175

@interfaceutil.implementer(repository.irevisiondelta)
@attr.s(slots=True)
class revlogrevisiondelta:
    # Slotted attrs record declared as implementing
    # ``repository.irevisiondelta``.  Every field except ``linknode`` is
    # required; attribute order defines the positional constructor order.

    # node of the revision and of its two parents
    node = attr.ib()
    p1node = attr.ib()
    p2node = attr.ib()
    # node the delta is based on
    basenode = attr.ib()
    flags = attr.ib()
    baserevisionsize = attr.ib()
    # payload fields: full revision and/or delta, plus sidedata
    revision = attr.ib()
    delta = attr.ib()
    sidedata = attr.ib()
    protocol_flags = attr.ib()
    # the only optional field
    linknode = attr.ib(default=None)

189

190

191

@interfaceutil.implementer(repository.iverifyproblem)
@attr.s(frozen=True)
class revlogproblem:
    # Frozen attrs record declared as implementing
    # ``repository.iverifyproblem``.  All three fields are optional and
    # default to None.
    warning = attr.ib(default=None)
    error = attr.ib(default=None)
    node = attr.ib(default=None)

197

198

199

def parse_index_v1(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` (default format).

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # delegate to the C implementation to parse the index data
    parsed_index, chunk_cache = parsers.parse_index2(data, inline)
    return parsed_index, chunk_cache

203

204

205

def parse_index_v2(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` as REVLOGV2.

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # delegate to the C implementation to parse the index data
    parsed_index, chunk_cache = parsers.parse_index2(
        data, inline, format=REVLOGV2
    )
    return parsed_index, chunk_cache

209

210

211

def parse_index_cl_v2(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` as CHANGELOGV2.

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # delegate to the C implementation to parse the index data
    parsed_index, chunk_cache = parsers.parse_index2(
        data, inline, format=CHANGELOGV2
    )
    return parsed_index, chunk_cache

215

216

217

# ``parse_index_v1_nodemap`` is only a real function when the loaded
# ``parsers`` module provides ``parse_index_devel_nodemap``; otherwise the
# name is bound to None.
if not hasattr(parsers, 'parse_index_devel_nodemap'):
    parse_index_v1_nodemap = None
else:

    def parse_index_v1_nodemap(data, inline):
        """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``.

        Returns the ``(index, cache)`` pair produced by the parser.
        """
        parsed_index, chunk_cache = parsers.parse_index_devel_nodemap(
            data, inline
        )
        return parsed_index, chunk_cache

226

227

228

def parse_index_v1_rust(data, inline, default_header):
    """Build a ``rustrevlog.Index`` over ``data``.

    Returns ``(index, cache)``.  ``cache`` is ``(0, data)`` when ``inline``
    is truthy and None otherwise.
    """
    if inline:
        cache = (0, data)
    else:
        cache = None
    return rustrevlog.Index(data, default_header), cache

231

232

233

# corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
# signed integer), i.e. the largest positive 32-bit signed value
_maxentrysize = 2**31 - 1

# Translated message template; expects, in order: one %s value followed by
# three %d values (expected byte count, offset, data size).
FILE_TOO_SHORT_MSG = _(
    b'cannot read from revlog %s;'
    b' expected %d bytes from offset %d, data size is %d'
)

# every byte accepted as a hexadecimal digit (both letter cases)
hexdigits = b'0123456789abcdefABCDEF'

243

244

245

class _Config:
    """Common base for the configuration holder classes."""

    def copy(self):
        """Return a new object of the same class as ``self``.

        The instance attributes of ``self`` are passed to the class as
        keyword arguments; attribute values are shared, not copied.
        """
        attributes = vars(self)
        return type(self)(**attributes)

248

249

250

@attr.s()
class FeatureConfig(_Config):
    """Hold configuration values about the available revlog features"""

    # name of the default compression engine
    compression_engine = attr.ib(default=b'zlib')
    # options for the compression engines (a fresh dict per instance)
    compression_engine_options = attr.ib(default=attr.Factory(dict))

    # whether censor can be used on this revlog
    censorable = attr.ib(default=False)
    # whether this revlog uses the "side data" feature
    has_side_data = attr.ib(default=False)
    # might remove rank configuration once the computation has no impact
    compute_rank = attr.ib(default=False)
    # Parent order is supposed to be semantically irrelevant, so parents
    # are normally re-sorted to ensure that the first parent is non-null
    # whenever there is a non-null parent at all.
    # filelog abuses the parent order as a flag to mark some instances of
    # meta-encoded files, so it is allowed to disable this behavior.
    canonical_parent_order = attr.ib(default=False)
    # whether ellipsis commits can be used
    enable_ellipsis = attr.ib(default=False)

    def copy(self):
        """Copy this config, giving the copy its own options mapping.

        The base-class copy shares attribute values, so the
        ``compression_engine_options`` mapping is duplicated separately.
        """
        duplicate = super().copy()
        own_options = self.compression_engine_options.copy()
        duplicate.compression_engine_options = own_options
        return duplicate

278

279

280

@attr.s()
class DataConfig(_Config):
    """Hold configuration values about how the revlog data is read"""

    # whether to try opening the "pending" version of the revlog
    try_pending = attr.ib(default=False)
    # whether to try opening the "split" version of the revlog
    try_split = attr.ib(default=False)
    # When True, indexfile should be opened with checkambig=True at
    # writing, to avoid file stat ambiguity.
    check_ambig = attr.ib(default=False)

    # If true, use mmap instead of reading to deal with large indexes
    mmap_large_index = attr.ib(default=False)
    # size from which an index counts as large
    mmap_index_threshold = attr.ib(default=None)
    # How much data to read and cache into the raw revlog data cache.
    chunk_cache_size = attr.ib(default=65536)

    # Size of the uncompressed cache relative to the largest revision seen.
    uncompressed_cache_factor = attr.ib(default=None)

    # Number of chunks cached
    uncompressed_cache_count = attr.ib(default=None)

    # Allow sparse reading of the revlog data
    with_sparse_read = attr.ib(default=False)
    # minimal density of a sparse read chunk
    sr_density_threshold = attr.ib(default=0.50)
    # minimal size of data we skip when performing sparse read
    sr_min_gap_size = attr.ib(default=262144)

    # whether deltas are encoded against arbitrary bases
    # NOTE(review): presumably mirrors DeltaConfig.general_delta; confirm.
    generaldelta = attr.ib(default=False)

314

315

316

@attr.s()
class DeltaConfig(_Config):
    """Hold configuration values about how new deltas are computed

    Some attributes are duplicated from DataConfig to help keep each
    object self-contained.
    """

    # whether deltas can be encoded against arbitrary bases
    general_delta = attr.ib(default=False)
    # Allow sparse writing of the revlog data
    sparse_revlog = attr.ib(default=False)
    # maximum length of a delta chain
    max_chain_len = attr.ib(default=None)
    # Maximum distance between delta chain base start and end
    max_deltachain_span = attr.ib(default=-1)
    # If `upper_bound_comp` is not None, this is the expected maximal gain
    # from compression for the data content.
    upper_bound_comp = attr.ib(default=None)
    # Should we try a delta against both parents
    delta_both_parents = attr.ib(default=True)
    # Test delta base candidate groups in chunks of this maximal size.
    candidate_group_chunk_size = attr.ib(default=0)
    # Should we display debug information about delta computation
    debug_delta = attr.ib(default=False)
    # trust incoming deltas by default
    lazy_delta = attr.ib(default=True)
    # whether to trust the base of incoming deltas (off by default)
    lazy_delta_base = attr.ib(default=False)

345

346

347

class _InnerRevlog:

347

class _InnerRevlog:

348

"""An inner layer of the revlog object

348

"""An inner layer of the revlog object

349

350

That layer exists to be able to delegate some operations to Rust; its

350

That layer exists to be able to delegate some operations to Rust; its

351

boundaries are arbitrary and based on what we can delegate to Rust.

351

boundaries are arbitrary and based on what we can delegate to Rust.

352

"""

352

"""

353

354

def __init__(
    self,
    opener,
    index,
    index_file,
    data_file,
    sidedata_file,
    inline,
    data_config,
    delta_config,
    feature_config,
    chunk_cache,
    default_compression_header,
):
    """Store the given collaborators and set up the caches.

    Two ``randomaccessfile`` objects are created: one for the revision
    data (reading from ``index_file`` when ``inline`` is truthy, from
    ``data_file`` otherwise) and one for ``sidedata_file``.  Only the
    first one is seeded with ``chunk_cache``.
    """
    self.opener = opener
    self.index = index

    self.index_file = index_file
    self.data_file = data_file
    self.sidedata_file = sidedata_file
    self.inline = inline
    self.data_config = data_config
    self.delta_config = delta_config
    self.feature_config = feature_config

    # used during diverted write.
    self._orig_index_file = None

    self._default_compression_header = default_compression_header

    # 3-tuple of file handles being used for active writing.
    self._writinghandles = None

    # inline revlogs keep their data inside the index file
    segment_path = index_file if inline else data_file
    cache_size = data_config.chunk_cache_size
    self._segmentfile = randomaccessfile.randomaccessfile(
        opener,
        segment_path,
        cache_size,
        chunk_cache,
    )
    self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
        opener,
        sidedata_file,
        cache_size,
    )

    # revlog header -> revlog compressor
    self._decompressors = {}
    # 3-tuple of (node, rev, text) for a raw revision.
    self._revisioncache = None

    # cache some uncompressed chunks
    # rev → uncompressed_chunk
    #
    # the max cost is dynamically updated to be proportional to the
    # size of revision we actually encounter.
    self._uncompressed_chunk_cache = None
    if data_config.uncompressed_cache_factor is not None:
        self._uncompressed_chunk_cache = util.lrucachedict(
            data_config.uncompressed_cache_count,
            maxcost=65536,  # some arbitrary initial value
        )

    self._delay_buffer = None

419

420

def __len__(self):
    """Return the number of entries in ``self.index``."""
    entries = self.index
    return len(entries)

422

423

def clear_cache(self):
    """Drop every cache held by this object.

    Must not be called while the revlog is delaying (asserted).  Resets
    the revision cache, empties the uncompressed chunk cache when there is
    one, and clears the caches of both segment files.
    """
    assert not self.is_delaying
    self._revisioncache = None
    chunk_cache = self._uncompressed_chunk_cache
    if chunk_cache is not None:
        chunk_cache.clear()
    self._segmentfile.clear_cache()
    self._segmentfile_sidedata.clear_cache()

430

431

@property
def canonical_index_file(self):
    """The original index file if one is recorded, else ``index_file``.

    ``_orig_index_file`` takes precedence whenever it is not None.
    """
    original = self._orig_index_file
    return self.index_file if original is None else original

436

437

@property
def is_delaying(self):
    """Is the revlog currently delaying the visibility of written data?

    The delaying mechanism can be either in-memory (``_delay_buffer`` is
    set) or written on disk in a side-file (``_orig_index_file`` is set).
    """
    nothing_delayed = (
        self._delay_buffer is None and self._orig_index_file is None
    )
    return not nothing_delayed

446

447

# Derived from index values.

447

# Derived from index values.

448

449

def start(self, rev):
    """the offset of the data chunk for this revision"""
    # The first field of the index entry carries the offset above its
    # 16 lowest bits; those low bits are dropped here.
    packed = self.index[rev][0]
    return int(packed >> 16)

452

453

def length(self, rev):
    """the length of the data chunk for this revision"""
    entry = self.index[rev]
    return entry[1]

456

457

def end(self, rev):
    """the end of the data chunk for this revision"""
    first_byte = self.start(rev)
    return first_byte + self.length(rev)

460

461

def deltaparent(self, rev):
    """return deltaparent of the given revision

    A revision whose recorded base is itself has no delta parent
    (``nullrev``).  Otherwise the parent is the recorded base when general
    delta is enabled, and the previous revision when it is not.
    """
    base = self.index[rev][3]
    if base == rev:
        return nullrev
    if self.delta_config.general_delta:
        return base
    return rev - 1

470

471

def issnapshot(self, rev):
    """tells whether rev is a snapshot"""
    if not self.delta_config.sparse_revlog:
        # without sparse-revlog, only revisions with no delta parent count
        return self.deltaparent(rev) == nullrev
    if hasattr(self.index, 'issnapshot'):
        # Rebind the index's method onto this instance so later calls skip
        # both the test above and this attribute lookup.
        self.issnapshot = self.index.issnapshot
        return self.issnapshot(rev)

    if rev == nullrev:
        return True
    entry = self.index[rev]
    base = entry[3]
    if base == rev or base == nullrev:
        return True

    def skip_empty(parent):
        # Step back through delta parents while the revision's data chunk
        # is empty, stopping once a revision is its own delta parent.
        while self.length(parent) == 0:
            previous = self.deltaparent(parent)
            if previous == parent:
                break
            parent = previous
        return parent

    p1 = skip_empty(entry[5])
    p2 = skip_empty(entry[6])
    if base == p1 or base == p2:
        # a delta against a (non-empty) parent is not a snapshot
        return False
    return self.issnapshot(base)

502

503

def _deltachain(self, rev, stoprev=None):
    """Obtain the delta chain for a revision.

    ``stoprev`` specifies a revision to stop at. If not specified, we
    stop at the base of the chain.

    Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
    revs in ascending order and ``stopped`` is a bool indicating whether
    ``stoprev`` was hit.
    """
    generaldelta = self.delta_config.general_delta
    # Prefer the index's own implementation when it has one.
    try:
        return self.index.deltachain(rev, stoprev, generaldelta)
    except AttributeError:
        pass

    # Local alias to avoid an attribute lookup in the tight loop.
    entries = self.index

    chain = []
    current = rev
    entry = entries[current]
    # Walk back until a revision that is its own base, or ``stoprev``.
    while not (current == entry[3] or current == stoprev):
        chain.append(current)
        current = entry[3] if generaldelta else current - 1
        entry = entries[current]

    stopped = current == stoprev
    if not stopped:
        # the chain base itself belongs to the chain; ``stoprev`` does not
        chain.append(current)

    chain.reverse()
    return chain, stopped

543

544

@util.propertycache
def _compressor(self):
    """Revlog compressor of the configured compression engine.

    The engine is looked up in ``util.compengines`` by the name in
    ``feature_config.compression_engine`` and is given the configured
    engine options.
    """
    features = self.feature_config
    engine = util.compengines[features.compression_engine]
    return engine.revlogcompressor(features.compression_engine_options)

550

551

@util.propertycache
def _decompressor(self):
    """Decompression callable matching the default compression header.

    Evaluates to ``None`` when no default compression header is set.
    """
    header = self._default_compression_header
    if header is None:
        return None
    return self._get_decompressor(header).decompress

559

560

def _get_decompressor(self, t):
    """Return the (de)compressor object registered for header ``t``.

    Objects are memoized in ``self._decompressors``. On a miss the engine
    is resolved through ``util.compengines.forrevlogheader`` and the new
    object is stored before being returned.

    Raises ``error.RevlogError`` when the lookup fails with ``KeyError``.
    """
    try:
        return self._decompressors[t]
    except KeyError:
        try:
            header_engine = util.compengines.forrevlogheader(t)
            options = self.feature_config.compression_engine_options
            found = header_engine.revlogcompressor(options)
            self._decompressors[t] = found
        except KeyError:
            msg = _(b'unknown compression type %s') % binascii.hexlify(t)
            raise error.RevlogError(msg)
        return found

575

576

def compress(self, data):
    """Return a ``(header, payload)`` pair for storing ``data``.

    - empty ``data`` is returned as is with an empty header;
    - when the compressor yields something truthy, that output is used
      with an empty header (the compressor already embedded its own);
    - otherwise ``data`` is kept uncompressed: with an empty header when
      it starts with a NUL byte, with a ``b'u'`` header in all other cases.
    """
    if data:
        packed = self._compressor.compress(data)
        if packed:
            # The revlog compressor added the header in the returned data.
            return b'', packed
        if data[0:1] != b'\0':
            return b'u', data
    return b'', data

590

591

def decompress(self, data):
    """Decompress a revlog chunk.

    The first byte of the chunk identifies how it was stored and selects
    the code path used to decode it. Empty input is returned unchanged.

    Raises ``error.RevlogError`` when zlib reports an error.
    """
    if not data:
        return data

    # Reads vastly outnumber writes and a chunk often decompresses in
    # microseconds, so the order of the checks below matters:
    #
    # 1) most chunks are compressed rather than stored raw;
    # 2) decompressing is likely at least 10x slower than handing back
    #    raw data;
    # 3) common, officially supported engines deserve priority.
    #
    # Hence the hard-coded header checks come first and the generic
    # compengines lookup last. `hg perfrevlogchunks` measured this as
    # ~0.5% faster for zlib chunks, which matters for changelog and
    # manifest reads.
    header = data[0:1]

    if header == b'x':
        try:
            return _zlibdecompress(data)
        except zlib.error as exc:
            msg = _(b'revlog decompress error: %s')
            msg %= stringutil.forcebytestr(exc)
            raise error.RevlogError(msg)
    # '\0' is more common than 'u' so it goes first.
    if header == b'\0':
        return data
    if header == b'u':
        return util.buffer(data, 1)

    return self._get_decompressor(header).decompress(data)

640

641

@contextlib.contextmanager
def reading(self):
    """Context manager wrapping the ``reading()`` contexts of both the
    data and the sidedata segment files.

    With an empty index nothing is opened. Raises
    ``error.ProgrammingError`` for an inline revlog that has a delay
    buffer.
    """
    if len(self.index) == 0:
        yield  # nothing to be read
        return
    if self._delay_buffer is not None and self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)
    with self._segmentfile.reading(), self._segmentfile_sidedata.reading():
        yield

653

654

@property
def is_writing(self):
    """True if a writing context is open (writing handles are set)"""
    handles = self._writinghandles
    return handles is not None

658

659

@property
def is_open(self):
    """Truthy when the data or the sidedata segment file reports itself open

    Used for assert and debug in the python code"""
    data_open = self._segmentfile.is_open
    return data_open or self._segmentfile_sidedata.is_open

665

666

@contextlib.contextmanager
def writing(self, transaction, data_end=None, sidedata_end=None):
    """Open the revlog files for writing

    Add content to a revlog should be done within such context.

    ``transaction`` gets an ``add(file, size)`` call for every file that is
    opened. ``data_end`` is the offset the data handle is positioned at
    (end of file when ``None``). ``sidedata_end`` is the offset the
    sidedata handle is positioned at and must be provided whenever the
    revlog has a sidedata file.

    If a writing context is already open, this is a no-op wrapper around
    the caller's block. Otherwise the index, data and sidedata handles are
    exposed through ``_writinghandles`` and the segment files for the
    duration of the block, then cleared and closed again.
    """
    if self.is_writing:
        yield
    else:
        ifh = dfh = sdfh = None
        try:
            r = len(self.index)
            # opening the data file.
            dsize = 0
            if r:
                dsize = self.end(r - 1)
            if not self.inline:
                try:
                    dfh = self.opener(self.data_file, mode=b"r+")
                    if data_end is None:
                        dfh.seek(0, os.SEEK_END)
                    else:
                        dfh.seek(data_end, os.SEEK_SET)
                except FileNotFoundError:
                    dfh = self.opener(self.data_file, mode=b"w+")
                transaction.add(self.data_file, dsize)
            if self.sidedata_file is not None:
                assert sidedata_end is not None
                # revlog-v2 does not inline, help Pytype
                assert dfh is not None
                try:
                    sdfh = self.opener(self.sidedata_file, mode=b"r+")
                    # Position the sidedata handle itself. Seeking `dfh`
                    # here would move the data handle away from the
                    # position set above and leave `sdfh` at offset 0.
                    sdfh.seek(sidedata_end, os.SEEK_SET)
                except FileNotFoundError:
                    sdfh = self.opener(self.sidedata_file, mode=b"w+")
                transaction.add(self.sidedata_file, sidedata_end)

            # opening the index file.
            isize = r * self.index.entry_size
            ifh = self.__index_write_fp()
            if self.inline:
                # an inline index file also holds the revision data
                transaction.add(self.index_file, dsize + isize)
            else:
                transaction.add(self.index_file, isize)
            # exposing all file handle for writing.
            self._writinghandles = (ifh, dfh, sdfh)
            self._segmentfile.writing_handle = ifh if self.inline else dfh
            self._segmentfile_sidedata.writing_handle = sdfh
            yield
        finally:
            self._writinghandles = None
            self._segmentfile.writing_handle = None
            self._segmentfile_sidedata.writing_handle = None
            if dfh is not None:
                dfh.close()
            if sdfh is not None:
                sdfh.close()
            # closing the index file last to avoid exposing referent to
            # potential unflushed data content.
            if ifh is not None:
                ifh.close()

728

729

def __index_write_fp(self, index_end=None):
    """internal method to open the index file for writing

    Do not call this directly, go through the ``writing`` context manager.

    The file is opened in ``r+`` mode and positioned at ``index_end`` (end
    of file when ``None``). If that fails with ``FileNotFoundError`` it is
    opened in ``w+`` mode instead and no seek is done.
    """

    def open_index(mode):
        if self._delay_buffer is None:
            return self.opener(
                self.index_file,
                mode=mode,
                checkambig=self.data_config.check_ambig,
            )
        # check_ambig affects the way a file is opened for writing.
        # Here no file is actually opened for writing since writes are
        # appended to the delay buffer, so check_ambig is neither
        # meaningful nor needed.
        return randomaccessfile.appender(
            self.opener, self.index_file, mode, self._delay_buffer
        )

    try:
        handle = open_index(b"r+")
        if index_end is None:
            handle.seek(0, os.SEEK_END)
        else:
            handle.seek(index_end, os.SEEK_SET)
        return handle
    except FileNotFoundError:
        return open_index(b"w+")

765

766

def __index_new_fp(self):
    """internal method to create a new index file for writing

    Only meant for the upgrade from an inline revlog. The file is opened
    in ``w`` mode with ``atomictemp=True``.
    """
    ambiguity_check = self.data_config.check_ambig
    return self.opener(
        self.index_file,
        mode=b"w",
        checkambig=ambiguity_check,
        atomictemp=True,
    )

777

778

def split_inline(self, tr, header, new_index_file_path=None):
    """split the data of an inline revlog into an index and a data file

    ``tr`` is not used in this method body.
    ``header`` is passed to ``self.index.pack_header`` and the result is
    written in front of the first index entry.
    ``new_index_file_path``, when given, replaces ``self.index_file``
    before the new index is written.

    Must not be called while a delay buffer is set. Returns
    ``self.index_file`` (possibly updated to ``new_index_file_path``).
    """
    assert self._delay_buffer is None
    # remember whether we were inside a writing context, so equivalent
    # handles can be installed again once the split is done
    existing_handles = False
    if self._writinghandles is not None:
        existing_handles = True
        fp = self._writinghandles[0]
        fp.flush()
        fp.close()
        # We can't use the cached file handle after close(). So prevent
        # its usage.
        self._writinghandles = None
        self._segmentfile.writing_handle = None
        # No need to deal with sidedata writing handle as it is only
        # relevant with revlog-v2 which is never inline, not reaching
        # this code

    new_dfh = self.opener(self.data_file, mode=b"w+")
    new_dfh.truncate(0)  # drop any potentially existing data
    try:
        # copy the data segment of every revision into the new data file
        with self.reading():
            for r in range(len(self.index)):
                new_dfh.write(self.get_segment_for_revs(r, r)[1])
            new_dfh.flush()

        if new_index_file_path is not None:
            self.index_file = new_index_file_path
        with self.__index_new_fp() as fp:
            # the revlog is flagged as non-inline before the index entries
            # are serialized below
            self.inline = False
            for i in range(len(self.index)):
                e = self.index.entry_binary(i)
                if i == 0:
                    # the packed header goes in front of the first entry
                    packed_header = self.index.pack_header(header)
                    e = packed_header + e
                fp.write(e)

            # If we don't use side-write, the temp file replace the real
            # index when we exit the context manager

        # from now on segments are read from the standalone data file
        self._segmentfile = randomaccessfile.randomaccessfile(
            self.opener,
            self.data_file,
            self.data_config.chunk_cache_size,
        )

        if existing_handles:
            # switched from inline to conventional reopen the index
            ifh = self.__index_write_fp()
            self._writinghandles = (ifh, new_dfh, None)
            self._segmentfile.writing_handle = new_dfh
            # the data handle now belongs to the writing handles, keep the
            # `finally` clause from closing it
            new_dfh = None
            # No need to deal with sidedata writing handle as it is only
            # relevant with revlog-v2 which is never inline, not reaching
            # this code
    finally:
        if new_dfh is not None:
            new_dfh.close()
    return self.index_file

836

837

def get_segment_for_revs(self, startrev, endrev):
    """Obtain a segment of raw data corresponding to a range of revisions.

    Takes the first and last revision of the range and returns a 2-tuple
    ``(offset, data)``: ``offset`` is the position the read started at
    and ``data`` is whatever ``self._segmentfile.read_chunk`` returned
    for the bytes from the start of ``startrev`` to the end of ``endrev``.

    For an inline revlog the positions are shifted by the index entries
    stored in front of each revision's data.

    Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
    to determine where each revision's data begins and ends.

    API: we should consider making this a private part of the InnerRevlog
    at some point.
    """
    # self.start(startrev) and self.end(endrev) are inlined here for perf
    # reasons (functions are expensive).
    idx = self.index
    first_entry = idx[startrev]
    start = int(first_entry[0] >> 16)
    if startrev != endrev:
        last_entry = idx[endrev]
        end = int(last_entry[0] >> 16) + last_entry[1]
    else:
        end = start + first_entry[1]

    if self.inline:
        entry_size = self.index.entry_size
        start += (startrev + 1) * entry_size
        end += (endrev + 1) * entry_size

    return start, self._segmentfile.read_chunk(start, end - start)

873

874

def _chunk(self, rev):
    """Obtain a single decompressed chunk for a revision.

    Takes an integer revision and returns its uncompressed chunk. The
    uncompressed chunk cache, when there is one, is consulted first and
    fed with the result afterwards.

    Raises ``error.RevlogError`` on an unknown compression mode.
    """
    cache = self._uncompressed_chunk_cache
    if cache is not None:
        hit = cache.get(rev)
        if hit is not None:
            return hit

    mode = self.index[rev][10]
    raw = self.get_segment_for_revs(rev, rev)[1]
    if mode == COMP_MODE_PLAIN:
        chunk = raw
    elif mode == COMP_MODE_DEFAULT:
        chunk = self._decompressor(raw)
    elif mode == COMP_MODE_INLINE:
        chunk = self.decompress(raw)
    else:
        msg = b'unknown compression mode %d'
        msg %= mode
        raise error.RevlogError(msg)

    if cache is not None:
        cache.insert(rev, chunk, cost=len(chunk))
    return chunk

903

904

def _chunks(self, revs, targetsize=None):
    """Obtain decompressed chunks for the specified revisions.

    Accepts an iterable of numeric revisions that are assumed to be in
    ascending order. ``targetsize`` is forwarded to
    ``deltautil.slicechunk`` when sparse reads are enabled.

    This function is similar to calling ``self._chunk()`` multiple times,
    but is faster.

    Returns a list with decompressed data for each requested revision,
    ordered by revision number.

    Raises ``error.RevlogError`` on an unknown compression mode.
    """
    if not revs:
        return []
    # Aliases to avoid repeated attribute lookups in the loops below.
    start = self.start
    length = self.length
    inline = self.inline
    iosize = self.index.entry_size
    buffer = util.buffer

    fetched_revs = []
    fadd = fetched_revs.append

    # (rev, chunk) pairs, sorted by rev right before returning
    chunks = []
    ladd = chunks.append

    if self._uncompressed_chunk_cache is None:
        fetched_revs = revs
    else:
        # serve what we can from the cache, fetch the rest from disk
        for rev in revs:
            cached_value = self._uncompressed_chunk_cache.get(rev)
            if cached_value is None:
                fadd(rev)
            else:
                ladd((rev, cached_value))

    if not fetched_revs:
        slicedchunks = ()
    elif not self.data_config.with_sparse_read:
        slicedchunks = (fetched_revs,)
    else:
        slicedchunks = deltautil.slicechunk(
            self,
            fetched_revs,
            targetsize=targetsize,
        )

    for revschunk in slicedchunks:
        firstrev = revschunk[0]
        # Skip trailing revisions with empty diff
        for lastrev in revschunk[::-1]:
            if length(lastrev) != 0:
                break

        try:
            offset, data = self.get_segment_for_revs(firstrev, lastrev)
        except OverflowError:
            # issue4215 - we can't cache a run of chunks greater than
            # 2G on Windows
            for rev in revschunk:
                ladd((rev, self._chunk(rev)))
            # This slice is fully handled. Falling through would use an
            # unbound (or stale) `offset`/`data` and add each revision a
            # second time.
            continue

        decomp = self.decompress
        # self._decompressor might be None, but will not be used in that case
        def_decomp = self._decompressor
        for rev in revschunk:
            chunkstart = start(rev)
            if inline:
                chunkstart += (rev + 1) * iosize
            chunklength = length(rev)
            comp_mode = self.index[rev][10]
            c = buffer(data, chunkstart - offset, chunklength)
            if comp_mode == COMP_MODE_INLINE:
                c = decomp(c)
            elif comp_mode == COMP_MODE_DEFAULT:
                c = def_decomp(c)
            elif comp_mode != COMP_MODE_PLAIN:
                msg = b'unknown compression mode %d'
                msg %= comp_mode
                raise error.RevlogError(msg)
            # COMP_MODE_PLAIN: the slice is used as is

            ladd((rev, c))
            if self._uncompressed_chunk_cache is not None:
                self._uncompressed_chunk_cache.insert(rev, c, len(c))

    # Order by revision only, so chunk payloads are never compared.
    chunks.sort(key=lambda item: item[0])
    return [x[1] for x in chunks]

993

994

def raw_text(self, node, rev):
    """return the possibly unvalidated rawtext for a revision

    returns (rev, rawtext, validated)

    ``validated`` is always ``False`` here and ``node`` is not used in
    this method body. The revision cache is dropped as a side effect.
    """
    # The cache entry looks like (node, rev, rawtext). When there is one,
    # its revision is handed to the delta chain walk as a stop point.
    cached = self._revisioncache
    cachedrev = cached[1] if cached else None

    chain, stopped = self._deltachain(rev, stoprev=cachedrev)
    # An intermediate text to apply deltas to, taken from the cache when
    # the chain walk stopped on the cached revision.
    basetext = cached[2] if stopped else None

    # drop cache to save memory, the caller is expected to
    # update self._inner._revisioncache after validating the text
    self._revisioncache = None

    rawsize = self.index[rev][2]
    targetsize = 4 * rawsize if 0 <= rawsize else None

    chunk_cache = self._uncompressed_chunk_cache
    if chunk_cache is not None:
        # dynamically update the uncompressed_chunk_cache size to the
        # largest revision we saw in this revlog.
        factor = self.data_config.uncompressed_cache_factor
        candidate_size = rawsize * factor
        if candidate_size > chunk_cache.maxcost:
            chunk_cache.maxcost = candidate_size

    bins = self._chunks(chain, targetsize=targetsize)
    if basetext is None:
        # no cached text to start from: the first chunk is the base
        basetext = bytes(bins[0])
        bins = bins[1:]

    rawtext = mdiff.patches(basetext, bins)
    del basetext  # let us have a chance to free memory early
    return (rev, rawtext, False)

1039

1040

def sidedata(self, rev, sidedata_end):
    """Read, decompress and deserialize the sidedata stored for ``rev``.

    ``sidedata_end`` is compared against the extent recorded in the index
    (offset + size) so that a too-short sidedata file is reported instead
    of being read.

    Returns an empty dict when the index records a sidedata size of zero.
    Raises ``error.RevlogError`` when the recorded extent goes past
    ``sidedata_end`` or when the stored compression mode is unknown.
    """
    entry = self.index[rev]
    start = entry[8]
    size = entry[9]

    if self.inline:
        # shift by the size of (rev + 1) index entries; presumably because
        # inline revlogs interleave index entries with the data
        start += self.index.entry_size * (1 + rev)
    if size == 0:
        return {}

    if sidedata_end < start + size:
        details = (self.sidedata_file, size, start, sidedata_end)
        raise error.RevlogError(FILE_TOO_SHORT_MSG % details)

    raw = self._segmentfile_sidedata.read_chunk(start, size)

    # the compression mode selects how the raw segment is decoded
    mode = self.index[rev][11]
    if mode == COMP_MODE_PLAIN:
        payload = raw
    elif mode == COMP_MODE_DEFAULT:
        payload = self._decompressor(raw)
    elif mode == COMP_MODE_INLINE:
        payload = self.decompress(raw)
    else:
        raise error.RevlogError(b'unknown compression mode %d' % mode)

    return sidedatautil.deserialize_sidedata(payload)

1077

1078

def write_entry(
    self,
    transaction,
    entry,
    data,
    link,
    offset,
    sidedata,
    sidedata_offset,
    index_end,
    data_end,
    sidedata_end,
):
    """Append one revision to the files opened for writing.

    ``entry`` is the packed index entry, ``data`` a two-item sequence
    written back to back, and ``sidedata`` the optional sidedata bytes.
    ``offset`` and ``sidedata_offset`` are registered with ``transaction``
    for the data and sidedata files. ``index_end``, ``data_end`` and
    ``sidedata_end`` are the positions to seek to before writing; ``None``
    for the index or data position means "end of file".

    Returns a tuple of the positions of the index, data and sidedata
    handles after the write (``None`` for a handle that is not set).

    Raises ``error.ProgrammingError`` when no writing handles are
    available, or when a delay buffer is set on an inline revlog.
    """
    # Handles opened in a+ mode do not behave the same on every platform.
    # Windows needs a positioning call whenever a handle switches between
    # reading and writing (see 3686fa2b8eee and the mixedfilemodewrapper
    # in windows.py). Elsewhere Python or the platform can be buggy: some
    # Solaris versions were seen not to append at the end of the file when
    # the handle had been seeked before the end (see issue4943).
    #
    # An explicit seek() before writing works around all of this. It is
    # probably unnecessary on Python 3, but the handle is shared with
    # readers that may have moved it, so be careful before dropping it.
    handles = self._writinghandles
    if handles is None:
        msg = b'adding revision outside `revlog._writing` context'
        raise error.ProgrammingError(msg)
    ifh, dfh, sdfh = handles

    if index_end is not None:
        ifh.seek(index_end, os.SEEK_SET)
    else:
        ifh.seek(0, os.SEEK_END)
    if dfh:
        if data_end is not None:
            dfh.seek(data_end, os.SEEK_SET)
        else:
            dfh.seek(0, os.SEEK_END)
    if sdfh:
        sdfh.seek(sidedata_end, os.SEEK_SET)

    rev_index = len(self.index) - 1
    if self.inline:
        if self._delay_buffer is not None:
            msg = b'invalid delayed write on inline revlog'
            raise error.ProgrammingError(msg)
        # inline: entry and data both go to the index file
        offset += rev_index * self.index.entry_size
        transaction.add(self.canonical_index_file, offset)
        assert not sidedata
        ifh.write(entry)
        ifh.write(data[0])
        ifh.write(data[1])
    else:
        transaction.add(self.data_file, offset)
        if self.sidedata_file:
            transaction.add(self.sidedata_file, sidedata_offset)
        transaction.add(self.canonical_index_file, rev_index * len(entry))
        if data[0]:
            dfh.write(data[0])
        dfh.write(data[1])
        if sidedata:
            sdfh.write(sidedata)
        if self._delay_buffer is None:
            ifh.write(entry)
        else:
            # index writes are delayed: keep the entry in memory
            self._delay_buffer.append(entry)

    index_pos = ifh.tell()
    data_pos = dfh.tell() if dfh else None
    sidedata_pos = sdfh.tell() if sdfh else None
    return (index_pos, data_pos, sidedata_pos)

1149

1150

def _divert_index(self):

1150

def _divert_index(self):

1151

return self.index_file + b'.a'

1151

return self.index_file + b'.a'

1152

1153

def delay(self):
    """Set up delayed or diverted index writes.

    Nothing is changed when a delay buffer or a diversion is already in
    place. With an empty index, ``index_file`` is switched to the diverted
    name (``_divert_index()``), any existing file of that name is removed,
    and that name is returned. Otherwise an empty in-memory delay buffer
    is installed.

    Returns the diverted index file name when a diversion was set up,
    ``None`` in every other case. Raises ``error.ProgrammingError`` on an
    inline revlog.
    """
    assert not self.is_open
    if self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)

    already_set_up = (
        self._delay_buffer is not None or self._orig_index_file is not None
    )
    if already_set_up:
        # delay or divert already in place
        return None

    if len(self.index) != 0:
        # existing revisions: buffer new index entries in memory
        self._delay_buffer = []
        return None

    # empty index: write everything to a side file instead
    self._orig_index_file = self.index_file
    self.index_file = self._divert_index()
    assert self._orig_index_file is not None
    assert self.index_file is not None
    if self.opener.exists(self.index_file):
        self.opener.unlink(self.index_file)
    return self.index_file

1172

1173

def write_pending(self):
    """Write the pending index state to the diverted index file.

    When a diversion is already active, nothing is written and
    ``(None, True)`` is returned. Otherwise the current index file is
    copied to the diverted name (replacing any existing file of that
    name), the delayed entries, if any, are appended to the copy, the
    delay buffer is dropped and ``index_file`` is switched to the copy.

    Returns ``(index_file, any_pending)`` where ``any_pending`` tells
    whether delayed entries were written. Raises
    ``error.ProgrammingError`` on an inline revlog.
    """
    assert not self.is_open
    if self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)
    if self._orig_index_file is not None:
        return None, True

    pending_index_file = self._divert_index()
    if self.opener.exists(pending_index_file):
        self.opener.unlink(pending_index_file)
    util.copyfile(
        self.opener.join(self.index_file),
        self.opener.join(pending_index_file),
    )

    any_pending = bool(self._delay_buffer)
    if any_pending:
        with self.opener(pending_index_file, b'r+') as ifh:
            ifh.seek(0, os.SEEK_END)
            ifh.write(b"".join(self._delay_buffer))

    # from here on the revlog is diverted rather than delayed
    self._delay_buffer = None
    self._orig_index_file = self.index_file
    self.index_file = pending_index_file
    return self.index_file, any_pending

1197

1198

def finalize_pending(self):
    """Make delayed or diverted index writes final.

    With a delay buffer in place, its entries (if any) are appended to
    the index file and the buffer is dropped. With a diversion in place,
    the diverted file, when it exists, is renamed over the original index
    file and ``index_file`` points to the original name again.

    Returns ``canonical_index_file``. Raises ``error.ProgrammingError``
    on an inline revlog or when neither a delay nor a diversion is set.
    """
    assert not self.is_open
    if self.inline:
        msg = "revlog with delayed write should not be inline"
        raise error.ProgrammingError(msg)

    delayed = self._delay_buffer is not None
    diverted = self._orig_index_file is not None

    if not (delayed or diverted):
        msg = b"not delay or divert found on this revlog"
        raise error.ProgrammingError(msg)

    if delayed and diverted:
        assert False, "unreachable"
    elif delayed:
        if self._delay_buffer:
            with self.opener(self.index_file, b'r+') as ifh:
                ifh.seek(0, os.SEEK_END)
                ifh.write(b"".join(self._delay_buffer))
        self._delay_buffer = None
    else:
        if self.opener.exists(self.index_file):
            self.opener.rename(
                self.index_file,
                self._orig_index_file,
                checkambig=True,
            )
        self.index_file = self._orig_index_file
        self._orig_index_file = None
    return self.canonical_index_file

1228

1229

1230

class revlog:

1230

class revlog:

1231

"""

1231

"""

1232

the underlying revision storage object

1232

the underlying revision storage object

1233

1234

A revlog consists of two parts, an index and the revision data.

1234

A revlog consists of two parts, an index and the revision data.

1235

1236

The index is a file with a fixed record size containing

1236

The index is a file with a fixed record size containing

1237

information on each revision, including its nodeid (hash), the

1237

information on each revision, including its nodeid (hash), the

1238

nodeids of its parents, the position and offset of its data within

1238

nodeids of its parents, the position and offset of its data within

1239

the data file, and the revision it's based on. Finally, each entry

1239

the data file, and the revision it's based on. Finally, each entry

1240

contains a linkrev entry that can serve as a pointer to external

1240

contains a linkrev entry that can serve as a pointer to external

1241

data.

1241

data.

1242

1243

The revision data itself is a linear collection of data chunks.

1243

The revision data itself is a linear collection of data chunks.

1244

Each chunk represents a revision and is usually represented as a

1244

Each chunk represents a revision and is usually represented as a

1245

delta against the previous chunk. To bound lookup time, runs of

1245

delta against the previous chunk. To bound lookup time, runs of

1246

deltas are limited to about 2 times the length of the original

1246

deltas are limited to about 2 times the length of the original

1247

version data. This makes retrieval of a version proportional to

1247

version data. This makes retrieval of a version proportional to

1248

its size, or O(1) relative to the number of revisions.

1248

its size, or O(1) relative to the number of revisions.

1249

1250

Both pieces of the revlog are written to in an append-only

1250

Both pieces of the revlog are written to in an append-only

1251

fashion, which means we never need to rewrite a file to insert or

1251

fashion, which means we never need to rewrite a file to insert or

1252

remove data, and can use some simple techniques to avoid the need

1252

remove data, and can use some simple techniques to avoid the need

1253

for locking while reading.

1253

for locking while reading.

1254

1255

If checkambig, indexfile is opened with checkambig=True at

1255

If checkambig, indexfile is opened with checkambig=True at

1256

writing, to avoid file stat ambiguity.

1256

writing, to avoid file stat ambiguity.

1257

1258

If mmaplargeindex is True, and an mmapindexthreshold is set, the

1258

If mmaplargeindex is True, and an mmapindexthreshold is set, the

1259

index will be mmapped rather than read if it is larger than the

1259

index will be mmapped rather than read if it is larger than the

1260

configured threshold.

1260

configured threshold.

1261

1262

If censorable is True, the revlog can have censored revisions.

1262

If censorable is True, the revlog can have censored revisions.

1263

1264

If `upperboundcomp` is not None, this is the expected maximal gain from

1264

If `upperboundcomp` is not None, this is the expected maximal gain from

1265

compression for the data content.

1265

compression for the data content.

1266

1267

`concurrencychecker` is an optional function that receives 3 arguments: a

1267

`concurrencychecker` is an optional function that receives 3 arguments: a

1268

file handle, a filename, and an expected position. It should check whether

1268

file handle, a filename, and an expected position. It should check whether

1269

the current position in the file handle is valid, and log/warn/fail (by

1269

the current position in the file handle is valid, and log/warn/fail (by

1270

raising).

1270

raising).

1271

1272

See mercurial/revlogutils/constants.py for details about the content of an

1272

See mercurial/revlogutils/constants.py for details about the content of an

1273

index entry.

1273

index entry.

1274

"""

1274

"""

1275

1276

_flagserrorclass = error.RevlogError

1276

_flagserrorclass = error.RevlogError

1277

1278

@staticmethod
def is_inline_index(header_bytes):
    """Tell from the first bytes of an index whether the revlog is inline.

    Empty ``header_bytes`` are reported as inline. Otherwise the header
    is unpacked with ``INDEX_HEADER``, split into a version (low 16 bits)
    and flags (remaining bits), and the ``b'inline'`` feature check of
    that version is applied to the flags.
    """
    if len(header_bytes) > 0:
        header = INDEX_HEADER.unpack(header_bytes)[0]
        version = header & 0xFFFF
        flags = header & ~0xFFFF
        inline_check = FEATURES_BY_VERSION[version][b'inline']
        return inline_check(flags)
    return True

1291

1292

def __init__(
    self,
    opener,
    target,
    radix,
    postfix=None,  # only exist for `tmpcensored` now
    checkambig=False,
    mmaplargeindex=False,
    censorable=False,
    upperboundcomp=None,
    persistentnodemap=False,
    concurrencychecker=None,
    trypending=False,
    try_split=False,
    canonical_parent_order=True,
    data_config=None,
    delta_config=None,
    feature_config=None,
    may_inline=True,  # may inline new revlog
):
    """Create a revlog object.

    ``opener`` is a function that abstracts the file opening operation
    and can be used to implement COW semantics or the like.

    ``target`` is a (KIND, ID) tuple identifying the content stored in
    this revlog. It helps the rest of the code understand what the revlog
    is about without resorting to heuristics and index filename analysis.
    Normal code must set it reliably, but test, debug, or performance
    measurement code might not set it to an accurate value.

    An explicit ``feature_config``, ``data_config`` or ``delta_config``
    is copied; when one is None, the matching entry of ``opener.options``
    is copied if present, else a default config is created. The
    ``censorable``, ``canonical_parent_order``, ``checkambig``,
    ``mmaplargeindex`` and ``upperboundcomp`` arguments are then stored
    on those configs.
    """

    def pick_config(explicit, option_key, factory):
        # explicit argument first, then the opener option, then a default
        if explicit is not None:
            return explicit.copy()
        if option_key in self.opener.options:
            return self.opener.options[option_key].copy()
        return factory()

    self.radix = radix

    # file names, filled in later
    self._docket_file = None
    self._indexfile = None
    self._datafile = None
    self._sidedatafile = None
    self._nodemap_file = None

    self.postfix = postfix
    self._trypending = trypending
    self._try_split = try_split
    self._may_inline = may_inline
    self.opener = opener
    if persistentnodemap:
        self._nodemap_file = nodemaputil.get_nodemap_file(self)

    assert target[0] in ALL_KINDS
    assert len(target) == 2
    self.target = target

    self.feature_config = pick_config(
        feature_config, b'feature-config', FeatureConfig
    )
    self.feature_config.censorable = censorable
    self.feature_config.canonical_parent_order = canonical_parent_order

    self.data_config = pick_config(data_config, b'data-config', DataConfig)
    self.data_config.check_ambig = checkambig
    self.data_config.mmap_large_index = mmaplargeindex

    self.delta_config = pick_config(
        delta_config, b'delta-config', DeltaConfig
    )
    self.delta_config.upper_bound_comp = upperboundcomp

    # Maps rev to chain base rev.
    self._chainbasecache = util.lrucachedict(100)

    self.index = None
    self._docket = None
    self._nodemap_docket = None
    # Mapping of partial identifiers to full nodes.
    self._pcache = {}

    # other optional features

    # Each revlog instance gets its own copy of the flag processors so
    # that it can support custom flags.
    self._flagprocessors = dict(flagutil.flagprocessors)
    # prevent nesting of addgroup
    self._adding_group = None

    chunk_cache = self._loadindex()
    self._load_inner(chunk_cache)
    self._concurrencychecker = concurrencychecker

1388

1389

def _init_opts(self):
    """Process options (from above/config) to set up the default revlog mode.

    These values might be affected when actually reading on-disk
    information.

    Returns a ``(new_header, mmapindexthreshold, force_nodemap)`` tuple
    for use in _loadindex():

    * new_header:
        version header to use if we need to create a new revlog

    * mmapindexthreshold:
        minimal index size to start using mmap; ``None`` unless
        ``data_config.mmap_large_index`` is set

    * force_nodemap:
        force the usage of a "development" version of the nodemap code

    Raises ``error.RevlogError`` when the configured chunk cache size is
    not greater than 0 or not a power of 2.
    """
    opts = self.opener.options

    if b'changelogv2' in opts and self.revlog_kind == KIND_CHANGELOG:
        new_header = CHANGELOGV2
        self.feature_config.compute_rank = opts.get(
            b'changelogv2.compute-rank', True
        )
    elif b'revlogv2' in opts:
        new_header = REVLOGV2
    elif b'revlogv1' in opts:
        new_header = REVLOGV1
        if self._may_inline:
            new_header |= FLAG_INLINE_DATA
        if b'generaldelta' in opts:
            new_header |= FLAG_GENERALDELTA
    elif b'revlogv0' in self.opener.options:
        new_header = REVLOGV0
    else:
        new_header = REVLOG_DEFAULT_VERSION

    mmapindexthreshold = (
        self.data_config.mmap_index_threshold
        if self.data_config.mmap_large_index
        else None
    )
    if self.feature_config.enable_ellipsis:
        self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

    # revlog v0 doesn't have flag processors
    for flag, processor in opts.get(b'flagprocessors', {}).items():
        flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

    cache_size = self.data_config.chunk_cache_size
    if cache_size <= 0:
        msg = _(b'revlog chunk cache size %r is not greater than 0')
        raise error.RevlogError(msg % cache_size)
    elif cache_size & (cache_size - 1):
        # a power of 2 has a single bit set, so n & (n - 1) is 0
        msg = _(b'revlog chunk cache size %r is not a power of 2')
        raise error.RevlogError(msg % cache_size)

    force_nodemap = opts.get(b'devel-force-nodemap', False)
    return new_header, mmapindexthreshold, force_nodemap

1447

1448

def _get_data(self, filepath, mmap_threshold, size=None):

1448

def _get_data(self, filepath, mmap_threshold, size=None):

1449

"""return a file content with or without mmap

1449

"""return a file content with or without mmap

1450

1451

If the file is missing return the empty string"""

1451

If the file is missing return the empty string"""

1452

try:

1452

try:

1453

with self.opener(filepath) as fp:

1453

with self.opener(filepath) as fp:

1454

if mmap_threshold is not None:

1454

if mmap_threshold is not None:

1455

file_size = self.opener.fstat(fp).st_size

1455

file_size = self.opener.fstat(fp).st_size

1456

if file_size >= mmap_threshold:

1456

if file_size >= mmap_threshold:

1457

if size is not None:

1457

if size is not None:

1458

# avoid potentiel mmap crash

1458

# avoid potentiel mmap crash

1459

size = min(file_size, size)

1459

size = min(file_size, size)

1460

# TODO: should .close() to release resources without

1460

# TODO: should .close() to release resources without

1461

# relying on Python GC

1461

# relying on Python GC

1462

if size is None:

1462

if size is None:

1463

return util.buffer(util.mmapread(fp))

1463

return util.buffer(util.mmapread(fp))

1464

else:

1464

else:

1465

return util.buffer(util.mmapread(fp, size))

1465

return util.buffer(util.mmapread(fp, size))

1466

if size is None:

1466

if size is None:

1467

return fp.read()

1467

return fp.read()

1468

else:

1468

else:

1469

return fp.read(size)

1469

return fp.read(size)

1470

except FileNotFoundError:

1470

except FileNotFoundError:

1471

return b''

1471

return b''

1472

1473

def get_streams(self, max_linkrev, force_inline=False):
    """return a list of streams that represent this revlog

    This is used by stream-clone to do bytes to bytes copies of a
    repository.

    Only the leading revisions are streamed: trailing revisions whose
    linkrev is not below `max_linkrev` are left out.

    If `force_inline` is set, it enforces that the stream will represent
    an inline revlog.

    It returns a list of three-tuples:

        [
            (filename, bytes_stream, stream_size),
            …
        ]

    An empty list is returned when there is nothing to send.
    """
    index = self.index
    rev_count = len(self)
    # note: this loop will rarely go through multiple iterations, since
    # it only traverses commits created during the current streaming
    # pull operation.
    #
    # If this becomes a problem, using a binary search should cap the
    # runtime of this.
    while rev_count > 0 and index[rev_count - 1][4] >= max_linkrev:
        rev_count -= 1
    if rev_count == 0:
        # no data to send
        return []
    index_size = rev_count * index.entry_size
    data_size = self.end(rev_count - 1)

    # XXX we might have been split (or stripped) since the object
    # initialization, We need to close this race too, but having a way to
    # pre-open the file we feed to the revlog and never closing them before
    # we are done streaming.

    if self._inline:
        total_size = index_size + data_size

        def get_stream():
            with self.opener(self._indexfile, mode=b"r") as fp:
                # first step only opens the file, see `next()` below
                yield None
                if total_size <= 65536:
                    yield fp.read(total_size)
                else:
                    yield from util.filechunkiter(fp, limit=total_size)

        inline_stream = get_stream()
        # advance to the first yield so the file is opened right away
        next(inline_stream)
        return [(self._indexfile, inline_stream, total_size)]

    if force_inline:

        def get_stream():
            with self.reading():
                yield None

                for rev in range(rev_count):
                    entry = self.index.entry_binary(rev)
                    if rev == 0 and self._docket is None:
                        # re-inject the inline flag
                        header = self._format_flags
                        header |= self._format_version
                        header |= FLAG_INLINE_DATA
                        entry = self.index.pack_header(header) + entry
                    yield entry
                    yield self._inner.get_segment_for_revs(rev, rev)[1]

        inline_stream = get_stream()
        next(inline_stream)
        return [(self._indexfile, inline_stream, index_size + data_size)]

    def get_index_stream():
        with self.opener(self._indexfile, mode=b"r") as fp:
            yield None
            if index_size <= 65536:
                yield fp.read(index_size)
            else:
                yield from util.filechunkiter(fp, limit=index_size)

    def get_data_stream():
        with self._datafp() as fp:
            yield None
            if data_size <= 65536:
                yield fp.read(data_size)
            else:
                yield from util.filechunkiter(fp, limit=data_size)

    # both generators are primed so that both files are opened before
    # returning
    index_stream = get_index_stream()
    next(index_stream)
    data_stream = get_data_stream()
    next(data_stream)
    return [
        (self._datafile, data_stream, data_size),
        (self._indexfile, index_stream, index_size),
    ]

1579

1580

def _loadindex(self, docket=None):
    """load the index and set up the format-dependent attributes

    The entry point file is selected from `self.postfix`, the pending
    (`.i.a`) file, the split index file, or the plain `<radix>.i` file, in
    that order of precedence.

    When `docket` is None, the header found in the entry point (or the
    default header from `self._init_opts()` when the file is empty or
    missing) decides the format version and flags. When `docket` is
    provided, it is used as is and the header is not read here.
    NOTE(review): in that case `self._format_version` is only read, never
    assigned, by this method — presumably the caller sets it beforehand;
    confirm.

    Returns the chunk cache produced by the index parser.

    Raises `error.RevlogError` for an unknown version, unknown flags, a
    truncated docket-referenced index, or an index that fails to parse.
    """

    new_header, mmapindexthreshold, force_nodemap = self._init_opts()

    # pick the file that acts as entry point for this revlog
    if self.postfix is not None:
        entry_point = b'%s.i.%s' % (self.radix, self.postfix)
    elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
        entry_point = b'%s.i.a' % self.radix
    elif self._try_split and self.opener.exists(self._split_index_file):
        entry_point = self._split_index_file
    else:
        entry_point = b'%s.i' % self.radix

    if docket is not None:
        self._docket = docket
        self._docket_file = entry_point
    else:
        self._initempty = True
        entry_data = self._get_data(entry_point, mmapindexthreshold)
        if len(entry_data) > 0:
            # the first four bytes hold the header
            header = INDEX_HEADER.unpack(entry_data[:4])[0]
            self._initempty = False
        else:
            header = new_header

        # low 16 bits: format version, remaining bits: format flags
        self._format_flags = header & ~0xFFFF
        self._format_version = header & 0xFFFF

        supported_flags = SUPPORTED_FLAGS.get(self._format_version)
        if supported_flags is None:
            msg = _(b'unknown version (%d) in revlog %s')
            msg %= (self._format_version, self.display_id)
            raise error.RevlogError(msg)
        elif self._format_flags & ~supported_flags:
            msg = _(b'unknown flags (%#04x) in version %d revlog %s')
            display_flag = self._format_flags >> 16
            msg %= (display_flag, self._format_version, self.display_id)
            raise error.RevlogError(msg)

        features = FEATURES_BY_VERSION[self._format_version]
        self._inline = features[b'inline'](self._format_flags)
        self.delta_config.general_delta = features[b'generaldelta'](
            self._format_flags
        )
        self.feature_config.has_side_data = features[b'sidedata']

        if not features[b'docket']:
            # the entry point is the index itself
            self._indexfile = entry_point
            index_data = entry_data
        else:
            # the entry point is a docket, the index lives elsewhere
            self._docket_file = entry_point
            if self._initempty:
                self._docket = docketutil.default_docket(self, header)
            else:
                self._docket = docketutil.parse_docket(
                    self, entry_data, use_pending=self._trypending
                )

    if self._docket is not None:
        self._indexfile = self._docket.index_filepath()
        index_data = b''
        index_size = self._docket.index_end
        if index_size > 0:
            # only read the part of the index the docket vouches for
            index_data = self._get_data(
                self._indexfile, mmapindexthreshold, size=index_size
            )
            if len(index_data) < index_size:
                msg = _(b'too few index data for %s: got %d, expected %d')
                msg %= (self.display_id, len(index_data), index_size)
                raise error.RevlogError(msg)

        self._inline = False
        # generaldelta implied by version 2 revlogs.
        self.delta_config.general_delta = True
        # the logic for persistent nodemap will be dealt with within the
        # main docket, so disable it for now.
        self._nodemap_file = None

    if self._docket is not None:
        self._datafile = self._docket.data_filepath()
        self._sidedatafile = self._docket.sidedata_filepath()
    elif self.postfix is None:
        self._datafile = b'%s.d' % self.radix
    else:
        self._datafile = b'%s.d.%s' % (self.radix, self.postfix)

    self.nodeconstants = sha1nodeconstants
    self.nullid = self.nodeconstants.nullid

    # sparse-revlog can't be on without general-delta (issue6056)
    if not self.delta_config.general_delta:
        self.delta_config.sparse_revlog = False

    self._storedeltachains = True

    devel_nodemap = (
        self._nodemap_file
        and force_nodemap
        and parse_index_v1_nodemap is not None
    )

    use_rust_index = False
    if rustrevlog is not None:
        if self._nodemap_file is not None:
            use_rust_index = True
        else:
            # Using the CIndex is no longer possible, as the
            # `AncestorsIterator` and `LazyAncestors` classes now require
            # a Rust index for instantiation.
            use_rust_index = True

    # select the parser; the version specific ones take precedence over
    # the nodemap and rust variants of the v1 parser
    self._parse_index = parse_index_v1
    if self._format_version == REVLOGV0:
        self._parse_index = revlogv0.parse_index_v0
    elif self._format_version == REVLOGV2:
        self._parse_index = parse_index_v2
    elif self._format_version == CHANGELOGV2:
        self._parse_index = parse_index_cl_v2
    elif devel_nodemap:
        self._parse_index = parse_index_v1_nodemap
    elif use_rust_index:
        self._parse_index = functools.partial(
            parse_index_v1_rust, default_header=new_header
        )
    try:
        d = self._parse_index(index_data, self._inline)
        index, chunkcache = d
        use_nodemap = (
            not self._inline
            and self._nodemap_file is not None
            and hasattr(index, 'update_nodemap_data')
        )
        if use_nodemap:
            nodemap_data = nodemaputil.persisted_data(self)
            if nodemap_data is not None:
                # note: this rebinds the `docket` argument to the nodemap
                # docket
                docket = nodemap_data[0]
                # only trust the persisted nodemap if its recorded tip
                # matches what the index holds at that revision
                if (
                    len(d[0]) > docket.tip_rev
                    and d[0][docket.tip_rev][7] == docket.tip_node
                ):
                    # no changelog tampering
                    self._nodemap_docket = docket
                    index.update_nodemap_data(*nodemap_data)
    except (ValueError, IndexError):
        raise error.RevlogError(
            _(b"index %s is corrupted") % self.display_id
        )
    self.index = index
    # revnum -> (chain-length, sum-delta-length)
    self._chaininfocache = util.lrucachedict(500)

    return chunkcache

1732

1733

def _load_inner(self, chunk_cache):
    """build `self._inner` from the already loaded index and configuration

    The default compression header comes from the docket when there is
    one, and is None otherwise.
    """
    docket = self._docket
    default_compression_header = (
        None if docket is None else docket.default_compression_header
    )

    inner_args = dict(
        opener=self.opener,
        index=self.index,
        index_file=self._indexfile,
        data_file=self._datafile,
        sidedata_file=self._sidedatafile,
        inline=self._inline,
        data_config=self.data_config,
        delta_config=self.delta_config,
        feature_config=self.feature_config,
        chunk_cache=chunk_cache,
        default_compression_header=default_compression_header,
    )
    self._inner = _InnerRevlog(**inner_args)

1752

1753

def get_revlog(self):
    """return the revlog itself

    This exists so a real revlog offers the same accessor as the objects
    that only wrap one.
    """
    return self

1756

1757

@util.propertycache
def revlog_kind(self):
    """the kind of this revlog, i.e. the first item of `self.target`"""
    target = self.target
    return target[0]

1760

1761

@util.propertycache
def display_id(self):
    """The public facing "ID" of the revlog that we use in message"""
    if self.revlog_kind != KIND_FILELOG:
        return self.radix
    # Reference the file without the "data/" prefix, so it is familiar
    # to the user.
    return self.target[1]

1770

1771

def _datafp(self, mode=b'r'):
    """open the revlog's data file with `mode` and return the file object"""
    opener = self.opener
    return opener(self._datafile, mode=mode)

1774

1775

def tiprev(self):
    """return the number of the last revision (-1 for an empty index)"""
    count = len(self.index)
    return count - 1

1777

1778

def tip(self):
    """return the node of the last revision"""
    last = self.tiprev()
    return self.node(last)

1780

1781

def __contains__(self, rev):
    """whether `rev` is a valid revision number for this revlog"""
    return rev >= 0 and rev < len(self)

1783

1784

def __len__(self):
    """return the number of entries in the index"""
    index = self.index
    return len(index)

1786

1787

def __iter__(self):
    """iterate over every revision number, in increasing order"""
    count = len(self)
    return iter(range(count))

1789

1790

def revs(self, start=0, stop=None):
    """iterate over all rev in this revlog (from start to stop)

    The iteration itself is delegated to `storageutil.iterrevs`.
    """
    total = len(self)
    return storageutil.iterrevs(total, start=start, stop=stop)

1793

1794

def hasnode(self, node):
    """whether `node` can be resolved to a revision by `self.rev`

    A `KeyError` raised by the lookup means "unknown node"; any other
    exception is propagated.
    """
    try:
        self.rev(node)
    except KeyError:
        return False
    return True

1800

1801

def _candelta(self, baserev, rev):
    """whether two revisions (baserev, rev) can be delta-ed or not"""
    # Disable delta if either rev requires a content-changing flag
    # processor (ex. LFS). This is because such flag processor can alter
    # the rawtext content that the delta will be based on, and two clients
    # could have a same revlog node with different flags (i.e. different
    # rawtext contents) and the delta could be incompatible.
    for candidate in (baserev, rev):
        if self.flags(candidate) & REVIDX_RAWTEXT_CHANGING_FLAGS:
            return False
    return True

1813

1814

def update_caches(self, transaction):
    """update on disk cache

    Nothing is done when the revlog has no nodemap file.

    If a transaction is passed, the update may be delayed to transaction
    commit."""
    if self._nodemap_file is None:
        return
    if transaction is None:
        nodemaputil.update_persistent_nodemap(self)
    else:
        nodemaputil.setup_persistent_nodemap(transaction, self)

1824

1825

def clearcaches(self):
    """Clear in-memory caches"""
    self._chainbasecache.clear()
    self._inner.clear_cache()
    self._pcache = {}
    self._nodemap_docket = None
    self.index.clearcaches()

    # The python code is the one responsible for validating the docket, we
    # end up having to refresh it here.
    if self._inline or self._nodemap_file is None:
        return
    if not hasattr(self.index, 'update_nodemap_data'):
        return
    nodemap_data = nodemaputil.persisted_data(self)
    if nodemap_data is not None:
        self._nodemap_docket = nodemap_data[0]
        self.index.update_nodemap_data(*nodemap_data)

1844

1845

def rev(self, node):
    """return the revision number associated with a <nodeid>

    Raises `error.WdirUnsupported` when the failed lookup was for one of
    the working directory pseudo node ids, `error.LookupError` for any
    other unknown node. A `TypeError` from the index is propagated as is.
    """
    try:
        return self.index.rev(node)
    except TypeError:
        # kept explicit: never translated into a lookup failure
        raise
    except error.RevlogError:
        # parsers.c radix tree lookup failed
        constants = self.nodeconstants
        is_wdir = (
            node == constants.wdirid or node in constants.wdirfilenodeids
        )
        if is_wdir:
            raise error.WdirUnsupported
        raise error.LookupError(node, self.display_id, _(b'no node'))

1859

1860

# Accessors for index entries.

1860

# Accessors for index entries.

1861

1862

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

1862

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

1863

# are flags.

1863

# are flags.

1864

def start(self, rev):
    """return the offset stored in the first index field of `rev`

    The low 16 bits of that field are dropped (see `flags`).
    """
    offset_flags = self.index[rev][0]
    return int(offset_flags >> 16)

1866

1867

def sidedata_cut_off(self, rev):
    """return field 8 of `rev` when non-zero, else a value derived from
    earlier revisions

    In the fallback case, the closest revision at or before `rev` with a
    non-zero field 9 is used and the sum of its fields 8 and 9 is
    returned; 0 is returned when there is none.
    """
    own_cut_off = self.index[rev][8]
    if own_cut_off != 0:
        return own_cut_off
    # This is some annoying dance, because entries without sidedata
    # currently use 0 as their offset. (instead of previous-offset +
    # previous-size)
    #
    # We should reconsider this sidedata → 0 sidedata_offset policy.
    # In the meantime, we need this.
    for candidate in range(rev, -1, -1):
        entry = self.index[candidate]
        if entry[9] != 0:
            return entry[8] + entry[9]
    return 0

1883

1884

def flags(self, rev):
    """return the low 16 bits of the first index field of `rev`"""
    offset_flags = self.index[rev][0]
    return offset_flags & 0xFFFF

1886

1887

def length(self, rev):
    """return the length recorded in the index for `rev` (field 1)"""
    entry = self.index[rev]
    return entry[1]

1889

1890

def sidedata_length(self, rev):
    """return field 9 of the index entry for `rev`

    Always 0 when the revlog format has no side data.
    """
    if self.feature_config.has_side_data:
        return self.index[rev][9]
    return 0

1894

1895

def rawsize(self, rev):
    """return the length of the uncompressed text for a given revision

    The value recorded in the index is used when it is not negative;
    otherwise the raw data is fetched and measured.
    """
    recorded = self.index[rev][2]
    if recorded >= 0:
        return recorded

    return len(self.rawdata(rev))

1903

1904

def size(self, rev):
    """length of non-raw text (processed by a "read" flag processor)"""
    rev_flags = self.flags(rev)
    # note: ELLIPSIS is known to not change the content.
    content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
    if rev_flags & content_changing != 0:
        return len(self.revision(rev))

    # fast path: if no "read" flag processor could change the content,
    # size is rawsize.
    return self.rawsize(rev)

1913

1914

def fast_rank(self, rev):
    """Return the rank of a revision if already known, or None otherwise.

    The rank of a revision is the size of the sub-graph it defines as a
    head. Equivalently, the rank of a revision `r` is the size of the set
    `ancestors(r)`, `r` included.

    This method returns the rank retrieved from the revlog in constant
    time. It makes no attempt at computing unknown values for versions of
    the revlog which do not persist the rank.
    """
    rank = self.index[rev][ENTRY_RANK]
    if self._format_version != CHANGELOGV2:
        return None
    if rank == RANK_UNKNOWN:
        return None
    # the null revision has rank 0 by convention
    return 0 if rev == nullrev else rank

1931

1932

def chainbase(self, rev):
    """return the revision found by following field 3 of the index entries

    Starting from `rev`, field 3 is followed until an entry points at
    itself. The result is memoized in `self._chainbasecache`.
    """
    cached = self._chainbasecache.get(rev)
    if cached is not None:
        return cached

    index = self.index
    current = rev
    while True:
        base = index[current][3]
        if base == current:
            break
        current = base

    self._chainbasecache[rev] = base
    return base

1946

1947

def linkrev(self, rev):
    """return the linkrev recorded in the index for `rev` (field 4)"""
    entry = self.index[rev]
    return entry[4]

1949

1950

def parentrevs(self, rev):
    """return the pair of parent revisions of `rev`

    With `feature_config.canonical_parent_order` set, the two parents are
    swapped when the first one is `nullrev`.

    Raises `error.WdirUnsupported` when `rev` is `wdirrev` and is not in
    the index; any other `IndexError` is propagated.
    """
    try:
        entry = self.index[rev]
    except IndexError:
        if rev == wdirrev:
            raise error.WdirUnsupported
        raise

    first, second = entry[5], entry[6]
    if self.feature_config.canonical_parent_order and first == nullrev:
        return second, first
    return first, second

1962

1963

# fast parentrevs(rev) where rev isn't filtered

1963

# fast parentrevs(rev) where rev isn't filtered

1964

_uncheckedparentrevs = parentrevs

1964

_uncheckedparentrevs = parentrevs

1965

1966

def node(self, rev):
    """Return the node id (field 7 of the index entry) for ``rev``.

    Raises ``error.WdirUnsupported`` when the lookup fails with
    ``IndexError`` and ``rev`` is ``wdirrev``; any other ``IndexError``
    propagates unchanged.
    """
    try:
        entry = self.index[rev]
        nodeid = entry[7]
    except IndexError:
        if rev != wdirrev:
            raise
        raise error.WdirUnsupported
    return nodeid

1973

1974

# Derived from index values.

1974

# Derived from index values.

1975

1976

def end(self, rev):
    """Return ``self.start(rev) + self.length(rev)``."""
    offset = self.start(rev)
    return offset + self.length(rev)

1978

1979

def parents(self, node):
    """Return the node ids of the two parents of ``node`` as ``(p1, p2)``.

    When ``feature_config.canonical_parent_order`` is enabled and the
    stored first parent is null, the pair is returned swapped, matching
    what ``parentrevs()`` does for revision numbers.
    """
    index = self.index
    entry = index[self.rev(node)]
    p1rev, p2rev = entry[5], entry[6]
    # Fields 5 and 6 hold parent *revision numbers* (they are used to
    # index ``index`` below), so the "no first parent" test has to compare
    # against nullrev.  Comparing with the nullid node id can never match
    # and silently disabled the canonical ordering.
    if self.feature_config.canonical_parent_order and p1rev == nullrev:
        p1rev, p2rev = p2rev, p1rev
    # inline node() to avoid function call overhead
    return index[p1rev][7], index[p2rev][7]

1987

1988

def chainlen(self, rev):
    """Return the first element of ``self._chaininfo(rev)``."""
    info = self._chaininfo(rev)
    return info[0]

1990

1991

def _chaininfo(self, rev):
    """Return ``(chain length, summed field-1 sizes)`` for ``rev``.

    The chain is walked from ``rev`` towards its base: through field 3 of
    each index entry when ``delta_config.general_delta`` is set, otherwise
    one revision back at a time.  Results are memoized in
    ``self._chaininfocache`` and a cached intermediate revision ends the
    walk early.
    """
    cache = self._chaininfocache
    if rev in cache:
        return cache[rev]

    entries = self.index
    follow_base = self.delta_config.general_delta
    current = rev
    entry = entries[current]
    length = 0
    size = 0
    reused_cache = False
    while current != entry[3]:
        length += 1
        size += entry[1]
        current = entry[3] if follow_base else current - 1
        if current in cache:
            known = cache[current]
            length += known[0]
            size += known[1]
            reused_cache = True
            break
        entry = entries[current]

    if not reused_cache:
        # Add text length of base since decompressing that also takes
        # work. For cache hits the length is already included.
        size += entry[1]

    result = (length, size)
    cache[rev] = result
    return result

2021

2022

def _deltachain(self, rev, stoprev=None):
    """Forward to ``self._inner._deltachain`` with the same arguments."""
    inner = self._inner
    return inner._deltachain(rev, stoprev=stoprev)

2024

2025

def ancestors(self, revs, stoprev=0, inclusive=False):
    """Return a lazy collection of the ancestors of ``revs``.

    Ancestors are produced in reverse revision order and revisions lower
    than ``stoprev`` are not generated.  ``inclusive`` is passed through
    to the underlying implementation.

    See the documentation for ancestor.lazyancestors for more details.
    """
    revs = list(revs)

    # first, make sure start revisions aren't filtered
    lookup = self.node
    for startrev in revs:
        lookup(startrev)
    # and we're sure ancestors aren't filtered as well

    if rustancestor is not None and self.index.rust_ext_compat:
        return rustancestor.LazyAncestors(
            self.index, revs, stoprev=stoprev, inclusive=inclusive
        )
    return ancestor.lazyancestors(
        self._uncheckedparentrevs, revs, stoprev=stoprev, inclusive=inclusive
    )

2045

2046

def descendants(self, revs):
    """Delegate to ``dagop.descendantrevs`` using this revlog's
    ``revs`` and ``parentrevs`` callables."""
    walker = self.revs
    parentsfn = self.parentrevs
    return dagop.descendantrevs(revs, walker, parentsfn)

2048

2049

def findcommonmissing(self, common=None, heads=None):
    """Return ``(has, missing)`` for the given common and head nodes.

    In revset terminology the result is the tuple:

      ::common, (::heads) - (::common)

    ``has`` is a lazy set-like object of revision numbers (ancestors of
    ``common``, ``common`` itself and nullrev).  ``missing`` is a list of
    node IDs sorted by revision number, meaning it is topologically
    sorted.

    'heads' and 'common' are both lists of node IDs.  If heads is not
    supplied, uses all of the revlog's heads.  If common is not supplied,
    uses nullid.
    """
    commonnodes = [self.nullid] if common is None else common
    headnodes = self.heads() if heads is None else heads

    common = [self.rev(n) for n in commonnodes]
    heads = [self.rev(n) for n in headnodes]

    # we want the ancestors, but inclusive
    class lazyset:
        """Union of an eagerly filled set and a lazily evaluated one."""

        def __init__(self, lazyvalues):
            self.addedvalues = set()
            self.lazyvalues = lazyvalues

        def __contains__(self, value):
            if value in self.addedvalues:
                return True
            return value in self.lazyvalues

        def __iter__(self):
            eager = self.addedvalues
            yield from eager
            for item in self.lazyvalues:
                if item not in eager:
                    yield item

        def add(self, value):
            self.addedvalues.add(value)

        def update(self, values):
            self.addedvalues.update(values)

    has = lazyset(self.ancestors(common))
    has.add(nullrev)
    has.update(common)

    # take all ancestors from heads that aren't in has
    missing = set()
    pending = collections.deque(h for h in heads if h not in has)
    while pending:
        rev = pending.popleft()
        if rev in missing:
            continue
        missing.add(rev)
        for parent in self.parentrevs(rev):
            if parent not in has:
                pending.append(parent)

    return has, [self.node(rev) for rev in sorted(missing)]

2112

2113

def incrementalmissingrevs(self, common=None):
    """Return an object for incrementally computing missing ancestors.

    The returned object can be used to compute the revision numbers of
    the ancestors of arbitrary sets that are not ancestors of ``common``.
    It is either ``rustancestor.MissingAncestors`` (when the Rust
    extension is available and the index is compatible) or an
    ``ancestor.incrementalmissingancestors`` object.

    'common' is a list of revision numbers.  If common is not supplied,
    uses nullrev.
    """
    bases = [nullrev] if common is None else common

    rust_usable = rustancestor is not None and self.index.rust_ext_compat
    if not rust_usable:
        return ancestor.incrementalmissingancestors(self.parentrevs, bases)
    return rustancestor.MissingAncestors(self.index, bases)

2128

2129

def findmissingrevs(self, common=None, heads=None):
    """Return the revision numbers of the ancestors of heads that
    are not ancestors of common.

    Every returned revision N satisfies both constraints:

      1. N is an ancestor of some revision in 'heads'
      2. N is not an ancestor of any revision in 'common'

    The result is whatever ``missingancestors()`` of the object returned
    by ``incrementalmissingrevs()`` produces.

    'heads' and 'common' are both lists of revision numbers.  If heads is
    not supplied, uses ``self.headrevs()``.  If common is not supplied,
    uses nullrev.
    """
    bases = [nullrev] if common is None else common
    tips = self.headrevs() if heads is None else heads

    finder = self.incrementalmissingrevs(common=bases)
    return finder.missingancestors(tips)

2152

2153

def findmissing(self, common=None, heads=None):
    """Return the ancestors of heads that are not ancestors of common.

    Every returned node N satisfies both constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    Nodes are converted to revision numbers, handed to the object
    returned by ``incrementalmissingrevs()``, and the resulting revisions
    are converted back to nodes in the order they are produced.

    'heads' and 'common' are both lists of node IDs.  If heads is not
    supplied, uses all of the revlog's heads.  If common is not supplied,
    uses nullid.
    """
    commonnodes = [self.nullid] if common is None else common
    headnodes = self.heads() if heads is None else heads

    commonrevs = [self.rev(n) for n in commonnodes]
    headrevs = [self.rev(n) for n in headnodes]

    finder = self.incrementalmissingrevs(common=commonrevs)
    result = []
    for rev in finder.missingancestors(headrevs):
        result.append(self.node(rev))
    return result

2178

2179

def nodesbetween(self, roots=None, heads=None):
    """Return a topological path from 'roots' to 'heads'.

    Return a tuple (nodes, outroots, outheads) where 'nodes' is a
    topologically sorted list of all nodes N that satisfy both of
    these constraints:

      1. N is a descendant of some node in 'roots'
      2. N is an ancestor of some node in 'heads'

    Every node is considered to be both a descendant and an ancestor
    of itself, so every reachable node in 'roots' and 'heads' will be
    included in 'nodes'.

    'outroots' is the list of reachable nodes in 'roots', i.e., the
    subset of 'roots' that is returned in 'nodes'.  Likewise,
    'outheads' is the subset of 'heads' that is also in 'nodes'.

    'roots' and 'heads' are both lists of node IDs.  If 'roots' is
    unspecified, uses nullid as the only root.  If 'heads' is
    unspecified, uses list of all of the revlog's heads.

    An empty 'roots' or 'heads' argument, or an empty intersection,
    yields three empty lists.
    """
    # Shared "nothing found" result returned by every early exit below.
    nonodes = ([], [], [])
    if roots is not None:
        roots = list(roots)
        if not roots:
            return nonodes
        lowestrev = min([self.rev(n) for n in roots])
    else:
        roots = [self.nullid]  # Everybody's a descendant of nullid
        lowestrev = nullrev
    if (lowestrev == nullrev) and (heads is None):
        # We want _all_ the nodes!
        return (
            [self.node(r) for r in self],
            [self.nullid],
            list(self.heads()),
        )
    if heads is None:
        # All nodes are ancestors, so the latest ancestor is the last
        # node.
        highestrev = len(self) - 1
        # Set ancestors to None to signal that every node is an ancestor.
        ancestors = None
        # Set heads to an empty dictionary for later discovery of heads
        heads = {}
    else:
        heads = list(heads)
        if not heads:
            return nonodes
        ancestors = set()
        # Turn heads into a dictionary so we can remove 'fake' heads.
        # Also, later we will be using it to filter out the heads we can't
        # find from roots.
        heads = dict.fromkeys(heads, False)
        # Start at the top and keep marking parents until we're done.
        nodestotag = set(heads)
        # Remember where the top was so we can use it as a limit later.
        highestrev = max([self.rev(n) for n in nodestotag])
        while nodestotag:
            # grab a node to tag
            n = nodestotag.pop()
            # Never tag nullid
            if n == self.nullid:
                continue
            # A node's revision number represents its place in a
            # topologically sorted list of nodes.
            r = self.rev(n)
            if r >= lowestrev:
                if n not in ancestors:
                    # If we are possibly a descendant of one of the roots
                    # and we haven't already been marked as an ancestor
                    ancestors.add(n)  # Mark as ancestor
                    # Add non-nullid parents to list of nodes to tag.
                    nodestotag.update(
                        [p for p in self.parents(n) if p != self.nullid]
                    )
                elif n in heads:  # We've seen it before, is it a fake head?
                    # So it is, real heads should not be the ancestors of
                    # any other heads.
                    heads.pop(n)
        if not ancestors:
            return nonodes
        # Now that we have our set of ancestors, we want to remove any
        # roots that are not ancestors.

        # If one of the roots was nullid, everything is included anyway.
        if lowestrev > nullrev:
            # But, since we weren't, let's recompute the lowest rev to not
            # include roots that aren't ancestors.

            # Filter out roots that aren't ancestors of heads
            roots = [root for root in roots if root in ancestors]
            # Recompute the lowest revision
            if roots:
                lowestrev = min([self.rev(root) for root in roots])
            else:
                # No more roots?  Return empty list
                return nonodes
        else:
            # We are descending from nullid, and don't need to care about
            # any other roots.
            lowestrev = nullrev
            roots = [self.nullid]
    # Transform our roots list into a set.
    descendants = set(roots)
    # Also, keep the original roots so we can filter out roots that aren't
    # 'real' roots (i.e. are descended from other roots).
    roots = descendants.copy()
    # Our topologically sorted list of output nodes.
    orderedout = []
    # Don't start at nullid since we don't want nullid in our output list,
    # and if nullid shows up in descendants, empty parents will look like
    # they're descendants.
    for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
        n = self.node(r)
        isdescendant = False
        if lowestrev == nullrev:  # Everybody is a descendant of nullid
            isdescendant = True
        elif n in descendants:
            # n is already a descendant
            isdescendant = True
            # This check only needs to be done here because all the roots
            # will start being marked as descendants before the loop.
            if n in roots:
                # If n was a root, check if it's a 'real' root.
                p = tuple(self.parents(n))
                # If any of its parents are descendants, it's not a root.
                if (p[0] in descendants) or (p[1] in descendants):
                    roots.remove(n)
        else:
            p = tuple(self.parents(n))
            # A node is a descendant if either of its parents are
            # descendants.  (We seeded the descendants set with the roots
            # up there, remember?)
            if (p[0] in descendants) or (p[1] in descendants):
                descendants.add(n)
                isdescendant = True
        if isdescendant and ((ancestors is None) or (n in ancestors)):
            # Only include nodes that are both descendants and ancestors.
            orderedout.append(n)
            if (ancestors is not None) and (n in heads):
                # We're trying to figure out which heads are reachable
                # from roots.
                # Mark this head as having been reached
                heads[n] = True
            elif ancestors is None:
                # Otherwise, we're trying to discover the heads.
                # Assume this is a head because if it isn't, the next step
                # will eventually remove it.
                heads[n] = True
                # But, obviously its parents aren't.
                for p in self.parents(n):
                    heads.pop(p, None)
    # Keep only the heads that were actually reached (flag set to True).
    heads = [head for head, flag in heads.items() if flag]
    roots = list(roots)
    assert orderedout
    assert roots
    assert heads
    return (orderedout, roots, heads)

2338

2339

def headrevs(self, revs=None):
    """Return head revisions, optionally restricted to ``revs``.

    Without ``revs`` the index's own ``headrevs()`` is used, falling back
    to ``self._headrevs()`` on ``AttributeError``.  With ``revs`` the
    computation is delegated to ``rustdagop.headrevs`` (when available and
    the index is compatible) or to ``dagop.headrevs``.
    """
    if revs is not None:
        if rustdagop is not None and self.index.rust_ext_compat:
            return rustdagop.headrevs(self.index, revs)
        return dagop.headrevs(revs, self._uncheckedparentrevs)

    try:
        return self.index.headrevs()
    except AttributeError:
        return self._headrevs()

2348

2349

def computephases(self, roots):
    """Forward ``roots`` to ``self.index.computephasesmapsets``."""
    index = self.index
    return index.computephasesmapsets(roots)

2351

2352

def _headrevs(self):
    """Compute head revisions by scanning the index.

    Returns ``[nullrev]`` when the revlog is empty; otherwise the list of
    iterated revisions that no iterated revision names as a parent
    (fields 5 and 6 of the index entries).
    """
    total = len(self)
    if not total:
        return [nullrev]

    # we won't iter over filtered rev so nobody is a head at start; the
    # extra trailing slot is the one hit by a -1 parent
    flags = [0] * (total + 1)
    entries = self.index
    for rev in self:
        flags[rev] = 1  # candidate head
        entry = entries[rev]
        # its parents cannot be heads
        flags[entry[5]] = 0
        flags[entry[6]] = 0
    return [rev for rev, flag in enumerate(flags) if flag]

2364

2365

def _head_node_ids(self):
    """Return the node ids of the heads.

    Uses ``self.index.head_node_ids()``; on ``AttributeError`` falls back
    to mapping ``self.headrevs()`` through ``self.node``.
    """
    try:
        return self.index.head_node_ids()
    except AttributeError:
        nodes = []
        for rev in self.headrevs():
            nodes.append(self.node(rev))
        return nodes

2370

2371

def heads(self, start=None, stop=None):
    """Return the list of all nodes that have no children.

    If start is specified, only heads that are descendants of start are
    returned.  If stop is specified, the revisions listed in stop are
    treated as if they had no children.

    With neither argument, an empty revlog yields ``[self.nullid]`` and
    a non-empty one yields ``self._head_node_ids()``.
    """
    if start is None and stop is None:
        if not len(self):
            return [self.nullid]
        return self._head_node_ids()

    startrev = nullrev if start is None else self.rev(start)

    stoprevs = set()
    for stopnode in stop or []:
        stoprevs.add(self.rev(stopnode))

    headrevs = dagop.headrevssubset(
        self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
    )
    return [self.node(rev) for rev in headrevs]

2395

2396

def children(self, node):
    """Find the children of a given node.

    Scans every revision after ``node``'s own and collects the nodes
    whose parent revisions include it.  For the null revision, revisions
    with no non-null parent are reported.
    """
    found = []
    target = self.rev(node)
    for rev in self.revs(start=target + 1):
        realparents = [p for p in self.parentrevs(rev) if p != nullrev]
        if not realparents:
            # a revision without real parents is a child of null only
            if target == nullrev:
                found.append(self.node(rev))
            continue
        for parent in realparents:
            if parent == target:
                found.append(self.node(rev))
    return found

2409

2410

def commonancestorsheads(self, a, b):
    """Calculate all the heads of the common ancestors of nodes a and b.

    Both nodes are converted to revisions, ``_commonancestorsheads`` does
    the work, and the resulting revisions are mapped back to nodes.
    """
    reva = self.rev(a)
    revb = self.rev(b)
    headrevs = self._commonancestorsheads(reva, revb)
    return pycompat.maplist(self.node, headrevs)

2415

2416

def _commonancestorsheads(self, *revs):
    """Calculate all the heads of the common ancestors of revs.

    The index's own ``commonancestorsheads`` is tried first; when it
    raises ``AttributeError`` or ``OverflowError`` the computation falls
    back to ``ancestor.commonancestorsheads``.
    """
    try:
        return self.index.commonancestorsheads(*revs)
    except (AttributeError, OverflowError):  # C implementation failed
        return ancestor.commonancestorsheads(self.parentrevs, *revs)

2423

2424

def isancestor(self, a, b):
    """Return True if node ``a`` is an ancestor of node ``b``.

    A revision is considered an ancestor of itself. Both nodes are resolved
    to revision numbers and the check is delegated to ``isancestorrev``.
    """
    rev_a = self.rev(a)
    rev_b = self.rev(b)
    return self.isancestorrev(rev_a, rev_b)

2430

2431

def isancestorrev(self, a, b):
    """Return True if revision ``a`` is an ancestor of revision ``b``.

    A revision is considered an ancestor of itself, and ``nullrev`` is an
    ancestor of everything. A revision numbered higher than ``b`` is never
    reported as its ancestor. Every other case is answered by
    ``reachableroots``.
    """
    if a == nullrev or a == b:
        return True
    if a > b:
        return False
    reached = self.reachableroots(a, [b], [a], includepath=False)
    return bool(reached)

2445

2446

def reachableroots(self, minroot, heads, roots, includepath=False):
    """Return (heads(::(<roots> and <roots>::<heads>))).

    If ``includepath`` is True, return (<roots>::<heads>).

    The index's ``reachableroots2`` is used when available; an
    ``AttributeError`` switches to the pure implementation in ``dagop``.
    """
    try:
        fast_result = self.index.reachableroots2(
            minroot, heads, roots, includepath
        )
    except AttributeError:
        # note the pure helper takes ``roots`` before ``heads``
        return dagop._reachablerootspure(
            self.parentrevs, minroot, roots, heads, includepath
        )
    return fast_result

2458

2459

def ancestor(self, a, b):
    """Return the "best" common ancestor of nodes ``a`` and ``b``.

    Returns ``self.nullid`` when no common ancestor is found. When several
    candidates exist, the smallest node is returned so the answer is stable.
    """
    rev_a = self.rev(a)
    rev_b = self.rev(b)
    try:
        candidates = self.index.ancestors(rev_a, rev_b)
    except (AttributeError, OverflowError):
        candidates = ancestor.ancestors(self.parentrevs, rev_a, rev_b)
    if not candidates:
        return self.nullid
    # choose a consistent winner when there's a tie
    return min(self.node(rev) for rev in candidates)

2471

2472

def _match(self, id):

2472

def _match(self, id):

2473

if isinstance(id, int):

2473

if isinstance(id, int):

2474

# rev

2474

# rev

2475

return self.node(id)

2475

return self.node(id)

2476

if len(id) == self.nodeconstants.nodelen:

2476

if len(id) == self.nodeconstants.nodelen:

2477

# possibly a binary node

2477

# possibly a binary node

2478

# odds of a binary node being all hex in ASCII are 1 in 10**25

2478

# odds of a binary node being all hex in ASCII are 1 in 10**25

2479

try:

2479

try:

2480

node = id

2480

node = id

2481

self.rev(node) # quick search the index

2481

self.rev(node) # quick search the index

2482

return node

2482

return node

2483

except error.LookupError:

2483

except error.LookupError:

2484

pass # may be partial hex id

2484

pass # may be partial hex id

2485

try:

2485

try:

2486

# str(rev)

2486

# str(rev)

2487

rev = int(id)

2487

rev = int(id)

2488

if b"%d" % rev != id:

2488

if b"%d" % rev != id:

2489

raise ValueError

2489

raise ValueError

2490

if rev < 0:

2490

if rev < 0:

2491

rev = len(self) + rev

2491

rev = len(self) + rev

2492

if rev < 0 or rev >= len(self):

2492

if rev < 0 or rev >= len(self):

2493

raise ValueError

2493

raise ValueError

2494

return self.node(rev)

2494

return self.node(rev)

2495

except (ValueError, OverflowError):

2495

except (ValueError, OverflowError):

2496

pass

2496

pass

2497

if len(id) == 2 * self.nodeconstants.nodelen:

2497

if len(id) == 2 * self.nodeconstants.nodelen:

2498

try:

2498

try:

2499

# a full hex nodeid?

2499

# a full hex nodeid?

2500

node = bin(id)

2500

node = bin(id)

2501

self.rev(node)

2501

self.rev(node)

2502

return node

2502

return node

2503

except (binascii.Error, error.LookupError):

2503

except (binascii.Error, error.LookupError):

2504

pass

2504

pass

2505

2506

def _partialmatch(self, id):

2506

def _partialmatch(self, id):

2507

# we don't care wdirfilenodeids as they should be always full hash

2507

# we don't care wdirfilenodeids as they should be always full hash

2508

maybewdir = self.nodeconstants.wdirhex.startswith(id)

2508

maybewdir = self.nodeconstants.wdirhex.startswith(id)

2509

ambiguous = False

2509

ambiguous = False

2510

try:

2510

try:

2511

partial = self.index.partialmatch(id)

2511

partial = self.index.partialmatch(id)

2512

if partial and self.hasnode(partial):

2512

if partial and self.hasnode(partial):

2513

if maybewdir:

2513

if maybewdir:

2514

# single 'ff...' match in radix tree, ambiguous with wdir

2514

# single 'ff...' match in radix tree, ambiguous with wdir

2515

ambiguous = True

2515

ambiguous = True

2516

else:

2516

else:

2517

return partial

2517

return partial

2518

elif maybewdir:

2518

elif maybewdir:

2519

# no 'ff...' match in radix tree, wdir identified

2519

# no 'ff...' match in radix tree, wdir identified

2520

raise error.WdirUnsupported

2520

raise error.WdirUnsupported

2521

else:

2521

else:

2522

return None

2522

return None

2523

except error.RevlogError:

2523

except error.RevlogError:

2524

# parsers.c radix tree lookup gave multiple matches

2524

# parsers.c radix tree lookup gave multiple matches

2525

# fast path: for unfiltered changelog, radix tree is accurate

2525

# fast path: for unfiltered changelog, radix tree is accurate

2526

if not getattr(self, 'filteredrevs', None):

2526

if not getattr(self, 'filteredrevs', None):

2527

ambiguous = True

2527

ambiguous = True

2528

# fall through to slow path that filters hidden revisions

2528

# fall through to slow path that filters hidden revisions

2529

except (AttributeError, ValueError):

2529

except (AttributeError, ValueError):

2530

# we are pure python, or key is not hex

2530

# we are pure python, or key is not hex

2531

pass

2531

pass

2532

if ambiguous:

2532

if ambiguous:

2533

raise error.AmbiguousPrefixLookupError(

2533

raise error.AmbiguousPrefixLookupError(

2534

id, self.display_id, _(b'ambiguous identifier')

2534

id, self.display_id, _(b'ambiguous identifier')

2535

)

2535

)

2536

2537

if id in self._pcache:

2537

if id in self._pcache:

2538

return self._pcache[id]

2538

return self._pcache[id]

2539

2540

if len(id) <= 40:

2540

if len(id) <= 40:

2541

# hex(node)[:...]

2541

# hex(node)[:...]

2542

l = len(id) // 2 * 2 # grab an even number of digits

2542

l = len(id) // 2 * 2 # grab an even number of digits

2543

try:

2543

try:

2544

# we're dropping the last digit, so let's check that it's hex,

2544

# we're dropping the last digit, so let's check that it's hex,

2545

# to avoid the expensive computation below if it's not

2545

# to avoid the expensive computation below if it's not

2546

if len(id) % 2 > 0:

2546

if len(id) % 2 > 0:

2547

if not (id[-1] in hexdigits):

2547

if not (id[-1] in hexdigits):

2548

return None

2548

return None

2549

prefix = bin(id[:l])

2549

prefix = bin(id[:l])

2550

except binascii.Error:

2550

except binascii.Error:

2551

pass

2551

pass

2552

else:

2552

else:

2553

nl = [e[7] for e in self.index if e[7].startswith(prefix)]

2553

nl = [e[7] for e in self.index if e[7].startswith(prefix)]

2554

nl = [

2554

nl = [

2555

n for n in nl if hex(n).startswith(id) and self.hasnode(n)

2555

n for n in nl if hex(n).startswith(id) and self.hasnode(n)

2556

]

2556

]

2557

if self.nodeconstants.nullhex.startswith(id):

2557

if self.nodeconstants.nullhex.startswith(id):

2558

nl.append(self.nullid)

2558

nl.append(self.nullid)

2559

if len(nl) > 0:

2559

if len(nl) > 0:

2560

if len(nl) == 1 and not maybewdir:

2560

if len(nl) == 1 and not maybewdir:

2561

self._pcache[id] = nl[0]

2561

self._pcache[id] = nl[0]

2562

return nl[0]

2562

return nl[0]

2563

raise error.AmbiguousPrefixLookupError(

2563

raise error.AmbiguousPrefixLookupError(

2564

id, self.display_id, _(b'ambiguous identifier')

2564

id, self.display_id, _(b'ambiguous identifier')

2565

)

2565

)

2566

if maybewdir:

2566

if maybewdir:

2567

raise error.WdirUnsupported

2567

raise error.WdirUnsupported

2568

return None

2568

return None

2569

2570

def lookup(self, id):
    """Locate a node from an identifier.

    The identifier may be:
     - a revision number or str(revision number)
     - a nodeid or a subset of a hex nodeid

    Raises ``error.LookupError`` when nothing matches.
    """
    exact = self._match(id)
    if exact is not None:
        return exact

    partial = self._partialmatch(id)
    if partial:
        return partial

    raise error.LookupError(id, self.display_id, _(b'no match found'))

2583

2584

def shortest(self, node, minlength=1):
    """Find the shortest unambiguous prefix that matches node.

    ``minlength`` is the smallest prefix length that may be returned.
    Raises ``error.LookupError`` when ``node`` is not known.
    """
    hexnode = hex(node)

    def prefixes(start):
        """Yield (length, prefix) for each prefix at least ``start`` long."""
        for size in range(start, len(hexnode) + 1):
            yield size, hexnode[:size]

    def isvalid(prefix):
        try:
            matched = self._partialmatch(prefix)
        except error.AmbiguousPrefixLookupError:
            return False
        except error.WdirUnsupported:
            # single 'ff...' match
            return True
        if matched is None:
            raise error.LookupError(node, self.display_id, _(b'no node'))
        return True

    def maybewdir(prefix):
        return all(c == b'f' for c in pycompat.iterbytestr(prefix))

    def disambiguate(start):
        """Disambiguate against wdirid."""
        for _size, prefix in prefixes(start):
            if not maybewdir(prefix):
                return prefix

    if not getattr(self, 'filteredrevs', None):
        try:
            length = max(self.index.shortest(node), minlength)
            return disambiguate(length)
        except error.RevlogError:
            if node != self.nodeconstants.wdirid:
                raise error.LookupError(
                    node, self.display_id, _(b'no node')
                )
        except AttributeError:
            # Fall through to pure code
            pass

    if node == self.nodeconstants.wdirid:
        for _size, prefix in prefixes(minlength):
            if isvalid(prefix):
                return prefix

    for size, prefix in prefixes(minlength):
        if isvalid(prefix):
            return disambiguate(size)

2634

2635

def cmp(self, node, text):
    """Compare ``text`` with the stored revision identified by ``node``.

    Returns True if ``text`` is different than what is stored. The check
    hashes ``text`` with the parents of ``node`` and compares the result
    with ``node``.
    """
    p1, p2 = self.parents(node)
    expected = storageutil.hashrevisionsha1(text, p1, p2)
    return expected != node

2642

2643

def deltaparent(self, rev):
    """Return the revision that ``rev`` is stored as a delta against.

    ``nullrev`` is returned when the index entry names ``rev`` itself as its
    base. Otherwise the recorded base is returned when general delta is
    enabled, and the previous revision when it is not.
    """
    base = self.index[rev][3]
    if base == rev:
        return nullrev
    if self.delta_config.general_delta:
        return base
    return rev - 1

2652

2653

def issnapshot(self, rev):
    """Tell whether ``rev`` is a snapshot.

    After the first successful call, the instance attribute ``issnapshot``
    is rebound to the inner object's method, so later calls on this
    instance go straight to it.
    """
    inner_check = self._inner.issnapshot
    answer = inner_check(rev)
    self.issnapshot = inner_check
    return answer

2658

2659

def snapshotdepth(self, rev):
    """Return the number of snapshots in the chain before ``rev``.

    Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
    """
    if not self.issnapshot(rev):
        # interpolate the revision so the message names the offending rev
        # instead of showing a literal "%d"
        raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
    return len(self._inner._deltachain(rev)[0]) - 1

2664

2665

def revdiff(self, rev1, rev2):
    """Return or calculate a delta between two revisions.

    The delta calculated is in binary form and is intended to be written to
    revlog data directly. So this function needs raw revision data.
    """
    # when rev2 is already stored as a delta against rev1, reuse that chunk
    stored_against_rev1 = rev1 != nullrev and self.deltaparent(rev2) == rev1
    if stored_against_rev1:
        return bytes(self._inner._chunk(rev2))

    old_raw = self.rawdata(rev1)
    new_raw = self.rawdata(rev2)
    return mdiff.textdiff(old_raw, new_raw)

2675

2676

def revision(self, nodeorrev):
    """Return the uncompressed revision for a node or revision number.

    Thin wrapper around ``_revisiondata`` with its default (non-raw) mode.
    """
    text = self._revisiondata(nodeorrev)
    return text

2681

2682

def sidedata(self, nodeorrev):
    """Return a map of extra data related to the changeset but not part of
    the hash.

    This function currently returns a dictionary. However, a more advanced
    mapping object will likely be used in the future for more
    efficient/lazy code.
    """
    # accept either a revision number or a node
    rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
    return self._sidedata(rev)

2695

2696

def _rawtext(self, node, rev):

2696

def _rawtext(self, node, rev):

2697

"""return the possibly unvalidated rawtext for a revision

2697

"""return the possibly unvalidated rawtext for a revision

2698

2699

returns (rev, rawtext, validated)

2699

returns (rev, rawtext, validated)

2700

"""

2700

"""

2701

# Check if we have the entry in cache

2701

# Check if we have the entry in cache

2702

# The cache entry looks like (node, rev, rawtext)

2702

# The cache entry looks like (node, rev, rawtext)

2703

if self._inner._revisioncache:

2703

if self._inner._revisioncache:

2704

if self._inner._revisioncache[0] == node:

2704

if self._inner._revisioncache[0] == node:

2705

return (rev, self._inner._revisioncache[2], True)

2705

return (rev, self._inner._revisioncache[2], True)

2706

2707

if rev is None:

2707

if rev is None:

2708

rev = self.rev(node)

2708

rev = self.rev(node)

2709

2710

return self._inner.raw_text(node, rev)

2710

return self._inner.raw_text(node, rev)

2711

2712

def _revisiondata(self, nodeorrev, raw=False):

2712

def _revisiondata(self, nodeorrev, raw=False):

2713

# deal with <nodeorrev> argument type

2713

# deal with <nodeorrev> argument type

2714

if isinstance(nodeorrev, int):

2714

if isinstance(nodeorrev, int):

2715

rev = nodeorrev

2715

rev = nodeorrev

2716

node = self.node(rev)

2716

node = self.node(rev)

2717

else:

2717

else:

2718

node = nodeorrev

2718

node = nodeorrev

2719

rev = None

2719

rev = None

2720

2721

# fast path the special `nullid` rev

2721

# fast path the special `nullid` rev

2722

if node == self.nullid:

2722

if node == self.nullid:

2723

return b""

2723

return b""

2724

2725

# ``rawtext`` is the text as stored inside the revlog. Might be the

2725

# ``rawtext`` is the text as stored inside the revlog. Might be the

2726

# revision or might need to be processed to retrieve the revision.

2726

# revision or might need to be processed to retrieve the revision.

2727

rev, rawtext, validated = self._rawtext(node, rev)

2727

rev, rawtext, validated = self._rawtext(node, rev)

2728

2729

if raw and validated:

2729

if raw and validated:

2730

# if we don't want to process the raw text and that raw

2730

# if we don't want to process the raw text and that raw

2731

# text is cached, we can exit early.

2731

# text is cached, we can exit early.

2732

return rawtext

2732

return rawtext

2733

if rev is None:

2733

if rev is None:

2734

rev = self.rev(node)

2734

rev = self.rev(node)

2735

# the revlog's flag for this revision

2735

# the revlog's flag for this revision

2736

# (usually alter its state or content)

2736

# (usually alter its state or content)

2737

flags = self.flags(rev)

2737

flags = self.flags(rev)

2738

2739

if validated and flags == REVIDX_DEFAULT_FLAGS:

2739

if validated and flags == REVIDX_DEFAULT_FLAGS:

2740

# no extra flags set, no flag processor runs, text = rawtext

2740

# no extra flags set, no flag processor runs, text = rawtext

2741

return rawtext

2741

return rawtext

2742

2743

if raw:

2743

if raw:

2744

validatehash = flagutil.processflagsraw(self, rawtext, flags)

2744

validatehash = flagutil.processflagsraw(self, rawtext, flags)

2745

text = rawtext

2745

text = rawtext

2746

else:

2746

else:

2747

r = flagutil.processflagsread(self, rawtext, flags)

2747

r = flagutil.processflagsread(self, rawtext, flags)

2748

text, validatehash = r

2748

text, validatehash = r

2749

if validatehash:

2749

if validatehash:

2750

self.checkhash(text, node, rev=rev)

2750

self.checkhash(text, node, rev=rev)

2751

if not validated:

2751

if not validated:

2752

self._inner._revisioncache = (node, rev, rawtext)

2752

self._inner._revisioncache = (node, rev, rawtext)

2753

2754

return text

2754

return text

2755

2756

def _sidedata(self, rev):

2756

def _sidedata(self, rev):

2757

"""Return the sidedata for a given revision number."""

2757

"""Return the sidedata for a given revision number."""

2758

sidedata_end = None

2758

sidedata_end = None

2759

if self._docket is not None:

2759

if self._docket is not None:

2760

sidedata_end = self._docket.sidedata_end

2760

sidedata_end = self._docket.sidedata_end

2761

return self._inner.sidedata(rev, sidedata_end)

2761

return self._inner.sidedata(rev, sidedata_end)

2762

2763

def rawdata(self, nodeorrev):
    """Return the uncompressed raw data for a node or revision number.

    Thin wrapper around ``_revisiondata`` with ``raw=True``.
    """
    raw_text = self._revisiondata(nodeorrev, raw=True)
    return raw_text

2766

2767

def hash(self, text, p1, p2):
    """Compute the node hash of ``text`` with parents ``p1`` and ``p2``.

    Available as a method so that subclasses can replace the hash
    as needed.
    """
    digest = storageutil.hashrevisionsha1(text, p1, p2)
    return digest

2774

2775

def checkhash(self, text, node, p1=None, p2=None, rev=None):
    """Check node hash integrity.

    Available as a method so that subclasses can extend hash mismatch
    behaviors as needed.

    Parents are looked up from ``node`` when neither ``p1`` nor ``p2`` is
    given. Raises ``error.RevlogError`` on mismatch, or
    ``error.CensoredNodeError`` when the revlog is censorable and ``text``
    is censored text.
    """
    try:
        if p1 is None and p2 is None:
            p1, p2 = self.parents(node)
        expected = self.hash(text, p1, p2)
        if node != expected:
            # Clear the revision cache on hash failure. The revision cache
            # only stores the raw revision and clearing the cache does have
            # the side-effect that we won't have a cache hit when the raw
            # revision data is accessed. But this case should be rare and
            # it is extra work to teach the cache about the hash
            # verification state.
            cached = self._inner._revisioncache
            if cached and cached[0] == node:
                self._inner._revisioncache = None

            # name the revision by number when known, else by short hex
            if rev is not None:
                revornode = rev
            else:
                revornode = templatefilters.short(hex(node))
            raise error.RevlogError(
                _(b"integrity check failed on %s:%s")
                % (self.display_id, pycompat.bytestr(revornode))
            )
    except error.RevlogError:
        censored = self.feature_config.censorable and storageutil.iscensoredtext(
            text
        )
        if censored:
            raise error.CensoredNodeError(self.display_id, node, text)
        raise

2810

2811

@property

2811

@property

2812

def _split_index_file(self):

2812

def _split_index_file(self):

2813

"""the path where to expect the index of an ongoing splitting operation

2813

"""the path where to expect the index of an ongoing splitting operation

2814

2815

The file will only exist if a splitting operation is in progress, but

2815

The file will only exist if a splitting operation is in progress, but

2816

it is always expected at the same location."""

2816

it is always expected at the same location."""

2817

parts = self.radix.split(b'/')

2817

parts = self.radix.split(b'/')

2818

if len(parts) > 1:

2818

if len(parts) > 1:

2819

# adds a '-s' prefix to the ``data/` or `meta/` base

2819

# adds a '-s' prefix to the ``data/` or `meta/` base

2820

head = parts[0] + b'-s'

2820

head = parts[0] + b'-s'

2821

mids = parts[1:-1]

2821

mids = parts[1:-1]

2822

tail = parts[-1] + b'.i'

2822

tail = parts[-1] + b'.i'

2823

pieces = [head] + mids + [tail]

2823

pieces = [head] + mids + [tail]

2824

return b'/'.join(pieces)

2824

return b'/'.join(pieces)

2825

else:

2825

else:

2826

# the revlog is stored at the root of the store (changelog or

2826

# the revlog is stored at the root of the store (changelog or

2827

# manifest), no risk of collision.

2827

# manifest), no risk of collision.

2828

return self.radix + b'.i.s'

2828

return self.radix + b'.i.s'

2829

2830

def _enforceinlinesize(self, tr, ~~side_write~~=~~True~~):

2830

def _enforceinlinesize(self, tr):

2831

"""Check if the revlog is too big for inline and convert if so.

2831

"""Check if the revlog is too big for inline and convert if so.

2832

2833

This should be called after revisions are added to the revlog. If the

2833

This should be called after revisions are added to the revlog. If the

2834

revlog has grown too large to be an inline revlog, it will convert it

2834

revlog has grown too large to be an inline revlog, it will convert it

2835

to use multiple index and data files.

2835

to use multiple index and data files.

2836

"""

2836

"""

2837

tiprev = len(self) - 1

2837

tiprev = len(self) - 1

2838

total_size = self.start(tiprev) + self.length(tiprev)

2838

total_size = self.start(tiprev) + self.length(tiprev)

2839

if not self._inline or (self._may_inline and total_size < _maxinline):

2839

if not self._inline or (self._may_inline and total_size < _maxinline):

2840

return

2840

return

2841

2842

if self._docket is not None:

2842

if self._docket is not None:

2843

msg = b"inline revlog should not have a docket"

2843

msg = b"inline revlog should not have a docket"

2844

raise error.ProgrammingError(msg)

2844

raise error.ProgrammingError(msg)

2845

2846

# In the common case, we enforce inline size because the revlog has

2846

# In the common case, we enforce inline size because the revlog has

2847

# been appened too. And in such case, it must have an initial offset

2847

# been appened too. And in such case, it must have an initial offset

2848

# recorded in the transaction.

2848

# recorded in the transaction.

2849

troffset = tr.findoffset(self._inner.canonical_index_file)

2849

troffset = tr.findoffset(self._inner.canonical_index_file)

2850

pre_touched = troffset is not None

2850

pre_touched = troffset is not None

2851

if not pre_touched and self.target[0] != KIND_CHANGELOG:

2851

if not pre_touched and self.target[0] != KIND_CHANGELOG:

2852

raise error.RevlogError(

2852

raise error.RevlogError(

2853

_(b"%s not found in the transaction") % self._indexfile

2853

_(b"%s not found in the transaction") % self._indexfile

2854

)

2854

)

2855

2856

tr.addbackup(self._inner.canonical_index_file, for_offset=pre_touched)

2856

tr.addbackup(self._inner.canonical_index_file, for_offset=pre_touched)

2857

tr.add(self._datafile, 0)

2857

tr.add(self._datafile, 0)

2858

2859

new_index_file_path = None

2859

new_index_file_path = None

2860

if side_write:

2860

old_index_file_path = self._indexfile

2861

~~old~~_index_file_path = self._indexfile

2861

new_index_file_path = self._split_index_file

2862

new_index_file_path = self._split_index_file

2862

opener = self.opener

2863

opener = self.opener

2863

weak_self = weakref.ref(self)

2864

weak_self = weakref.ref(self)

2864

2865

# the "split" index replace the real index when the transaction is

2866

# the "split" index replace the real index when the transaction is

2866

# finalized

2867

# finalized

2867

def finalize_callback(tr):

2868

def finalize_callback(tr):

2868

opener.rename(

2869

~~opener~~.~~rename~~(

2869

new_index_file_path,

2870

~~new~~_index_file_path,

2870

old_index_file_path,

2871

old_index_file_path,

2871

checkambig=True,

2872

checkambig=True,

2872

)

2873

)

2873

maybe_self = weak_self()

2874

maybe_self = ~~weak_self~~()

2874

if maybe_self is not None:

2875

if maybe_self is not None:

2875

maybe_self._indexfile = old_index_file_path

2876

maybe_self._indexfile = ~~old_index_file_path~~

2876

maybe_self._inner.index_file = maybe_self._indexfile

2877

maybe_self._inner.index_file = maybe_self._indexfile

2877

2878

def abort_callback(tr):

2879

def abort_callback(tr):

2879

maybe_self = weak_self()

2880

maybe_self = ~~weak_self~~()

2880

if maybe_self is not None:

2881

if maybe_self is not None:

2881

maybe_self._indexfile = old_index_file_path

2882

maybe_self._in~~dexfil~~e = ~~old_index_file_path~~

2882

maybe_self._inner.inline = True

2883

maybe_self._inner.in~~lin~~e = ~~True~~

2883

maybe_self._inner.index_file = old_index_file_path

2884

maybe_self._inner.index_file = old_index_file_path

2884

2885

tr.registertmp(new_index_file_path)

2886

tr.registertmp(new_index_file_path)

2886

if self.target[1] is not None:

2887

if self.target[1] is not None:

2887

callback_id = b'000-revlog-split-%d-%s' % self.target

2888

callback_id = b'000-revlog-split-%d-%s' % self.target

2888

else:

2889

else:

2889

callback_id = b'000-revlog-split-%d' % self.target[0]

2890

callback_id = b'000-revlog-split-%d' % self.target[0]

2890

tr.addfinalize(callback_id, finalize_callback)

2891

tr.add~~finalize~~(callback_id, ~~finalize~~_callback)

2891

tr.addabort(callback_id, abort_callback)

2892

tr.addabort(callback_id, abort_callback)

2893

2892

2894

self._format_flags &= ~FLAG_INLINE_DATA

2893

self._format_flags &= ~FLAG_INLINE_DATA

2895

self._inner.split_inline(

2894

self._inner.split_inline(

2896

tr,

2895

tr,

2897

self._format_flags | self._format_version,

2896

self._format_flags | self._format_version,

2898

new_index_file_path=new_index_file_path,

2897

new_index_file_path=new_index_file_path,

2899

)

2898

)

2900

2899

2901

self._inline = False

2900

self._inline = False

2902

if new_index_file_path is not None:

2901

if new_index_file_path is not None:

2903

self._indexfile = new_index_file_path

2902

self._indexfile = new_index_file_path

2904

2903

2905

nodemaputil.setup_persistent_nodemap(tr, self)

2904

nodemaputil.setup_persistent_nodemap(tr, self)

2906

2905

2907

def _nodeduplicatecallback(self, transaction, node):
    """Hook called when trying to add a node that is already stored.

    This implementation takes no action and ignores both arguments.
    """
    return None

2909

2908

2910

@contextlib.contextmanager
def reading(self):
    """Context manager wrapping the inner revlog's reading context.

    Enters ``self._inner.reading()`` and keeps it open for the duration of
    the caller's ``with`` body.
    """
    inner_context = self._inner.reading()
    with inner_context:
        yield

2914

2913

2915

@contextlib.contextmanager
def _writing(self, transaction):
    """Context manager inside which revisions may be written.

    Raises ``error.ProgrammingError`` when the revlog was opened in
    `trypending` mode.  When the inner revlog is already writing, this is a
    plain pass-through.  Otherwise the inner writing context is opened
    (seeded with the docket's data/sidedata end offsets when a docket
    exists) and, once the caller's body has completed, the docket is
    written back through ``self._write_docket``.
    """
    if self._trypending:
        raise error.ProgrammingError(
            b'try to write in a `trypending` revlog: %s' % self.display_id
        )

    if self._inner.is_writing:
        # somebody up the stack already opened the writing context
        yield
        return

    if self._docket is None:
        data_end = sidedata_end = None
    else:
        data_end = self._docket.data_end
        sidedata_end = self._docket.sidedata_end

    inner_writing = self._inner.writing(
        transaction,
        data_end=data_end,
        sidedata_end=sidedata_end,
    )
    with inner_writing:
        yield
        # only reached when the caller's body did not raise
        if self._docket is not None:
            self._write_docket(transaction)

2937

2936

2938

@property
def is_delaying(self):
    """Value of the inner revlog's ``is_delaying`` attribute."""
    inner = self._inner
    return inner.is_delaying

2941

2940

2942

def _write_docket(self, transaction):
    """Write the current docket to disk.

    This exists as a separate method to help changelog implement its
    transaction logic.

    The same transaction logic could conceivably be used for every revlog,
    since dockets are cheap.
    """
    docket = self._docket
    docket.write(transaction)

2950

2949

2951

def addrevision(
    self,
    text,
    transaction,
    link,
    p1,
    p2,
    cachedelta=None,
    node=None,
    flags=REVIDX_DEFAULT_FLAGS,
    deltacomputer=None,
    sidedata=None,
):
    """Add a revision to the log and return its revision number.

    text - the revision data to add
    transaction - the transaction object used for rollback
    link - the linkrev data to add
    p1, p2 - the parent nodeids of the revision
    cachedelta - an optional precomputed delta; dropped when the flag
        processors change the revision data
    node - nodeid of revision; typically node is not specified, and it is
        computed by default as hash(text, p1, p2), however subclasses might
        use different hashing method (and override checkhash() in such case)
    flags - the known flags to set on the revision
    deltacomputer - an optional deltacomputer instance shared between
        multiple calls
    sidedata - optional sidedata for the revision; None is treated as
        empty, and non-empty sidedata is rejected when the revlog does not
        support it

    If the node is already present in the index, the existing revision
    number is returned and nothing is written.
    """
    if link == nullrev:
        msg = _(b"attempted to add linkrev -1 to %s") % self.display_id
        raise error.RevlogError(msg)

    if sidedata is None:
        sidedata = {}
    if sidedata and not self.feature_config.has_side_data:
        raise error.ProgrammingError(
            _(b"trying to add sidedata to a revlog who don't support them")
        )

    # with flags set, the node (when not supplied) is derived from the
    # non-raw text, before the flag processors run
    if flags and not node:
        node = self.hash(text, p1, p2)

    rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

    if rawtext != text:
        # the flag processors rewrote the data: a delta computed against
        # the original text no longer applies
        cachedelta = None

    rawsize = len(rawtext)
    if rawsize > _maxentrysize:
        raise error.RevlogError(
            _(
                b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
            )
            % (self.display_id, rawsize)
        )

    if not node:
        node = self.hash(rawtext, p1, p2)

    existing_rev = self.index.get_rev(node)
    if existing_rev is not None:
        return existing_rev

    if validatehash:
        self.checkhash(rawtext, node, p1=p1, p2=p2)

    return self.addrawrevision(
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=cachedelta,
        deltacomputer=deltacomputer,
        sidedata=sidedata,
    )

3028

3027

3029

def addrawrevision(
    self,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    node,
    flags,
    cachedelta=None,
    deltacomputer=None,
    sidedata=None,
):
    """Add a raw revision whose flags, node and parents are already known.

    Useful when reusing a revision not stored in this revlog (ex: received
    over wire, or read from an external bundle).

    The work is done by ``_addrevision`` inside a ``_writing`` context, and
    its return value is passed back to the caller.
    """
    writing_context = self._writing(transaction)
    with writing_context:
        return self._addrevision(
            node,
            rawtext,
            transaction,
            link,
            p1,
            p2,
            flags,
            cachedelta,
            deltacomputer=deltacomputer,
            sidedata=sidedata,
        )

3059

3058

3060

def compress(self, data):
    """Return ``data`` compressed by the inner revlog's ``compress``."""
    inner = self._inner
    return inner.compress(data)

3062

3061

3063

def decompress(self, data):
    """Return ``data`` decompressed by the inner revlog's ``decompress``."""
    inner = self._inner
    return inner.decompress(data)

3065

3064

3066

def _addrevision(
    self,
    node,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    flags,
    cachedelta,
    alwayscache=False,
    deltacomputer=None,
    sidedata=None,
):
    """Internal function appending one revision to the log.

    See ``addrevision`` for the meaning of the arguments.

    Note: ``addrevision`` takes non-raw text, ``_addrevision`` takes raw
    text.

    If ``deltacomputer`` is not provided or None, a default
    ``deltautil.deltacomputer`` is created for this call.

    Invariants:
    - rawtext is optional (can be None); if not set, cachedelta must be set.
      If both are set, they must correspond to each other.

    Returns the revision number of the newly added entry.
    """
    if node == self.nullid:
        msg = _(b"%s: attempt to add null revision") % self.display_id
        raise error.RevlogError(msg)
    nodeconstants = self.nodeconstants
    if node == nodeconstants.wdirid or node in nodeconstants.wdirfilenodeids:
        msg = _(b"%s: attempt to add wdir revision") % self.display_id
        raise error.RevlogError(msg)
    if self._inner._writinghandles is None:
        raise error.ProgrammingError(
            b'adding revision outside `revlog._writing` context'
        )

    # one-element list handed to the revision info; it is read back after
    # the delta search (see ``rawtext = btext[0]`` below)
    btext = [rawtext]

    curr = len(self)
    offset = self._get_data_offset(curr - 1)

    checker = self._concurrencychecker
    if checker:
        ifh, dfh, sdfh = self._inner._writinghandles
        # XXX no checking for the sidedata file
        index_bytes = curr * self.index.entry_size
        if self._inline:
            # offset is "as if" it were in the .d file, so the size of the
            # entry metadata has to be added on top of it.
            checker(ifh, self._indexfile, offset + index_bytes)
        else:
            # Entries in the .i are a consistent size.
            checker(ifh, self._indexfile, index_bytes)
            checker(dfh, self._datafile, offset)

    p1r = self.rev(p1)
    p2r = self.rev(p2)

    # full versions are inserted when the needed deltas
    # become comparable to the uncompressed text
    if rawtext is not None:
        textlen = len(rawtext)
    else:
        # need rawtext size, before changed by flag processors, which is
        # the non-raw size. use revlog explicitly to avoid filelog's extra
        # logic that might remove metadata size.
        base_size = revlog.size(self, cachedelta[0])
        textlen = mdiff.patchedsize(base_size, cachedelta[1])

    if deltacomputer is None:
        if self.delta_config.debug_delta:
            write_debug = transaction._report
        else:
            write_debug = None
        deltacomputer = deltautil.deltacomputer(
            self, write_debug=write_debug
        )

    if cachedelta is not None and len(cachedelta) == 2:
        # The cached delta carries no instruction about how it should be
        # reused: add the default one according to the revlog's
        # configuration.
        delta_config = self.delta_config
        if delta_config.general_delta and delta_config.lazy_delta_base:
            reuse_policy = DELTA_BASE_REUSE_TRY
        else:
            reuse_policy = DELTA_BASE_REUSE_NO
        cachedelta = (cachedelta[0], cachedelta[1], reuse_policy)

    revinfo = revlogutils.revisioninfo(
        node,
        p1,
        p2,
        btext,
        textlen,
        cachedelta,
        flags,
    )

    deltainfo = deltacomputer.finddeltainfo(revinfo)

    compression_mode = COMP_MODE_INLINE
    if self._docket is not None:
        compression_mode, deltainfo = deltautil.delta_compression(
            self._docket.default_compression_header, deltainfo
        )

    if sidedata and self.feature_config.has_side_data:
        sidedata_compression_mode = COMP_MODE_PLAIN
        serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
        sidedata_offset = self._docket.sidedata_end
        comp_header, comp_sidedata = self._inner.compress(
            serialized_sidedata
        )
        use_compressed = (
            comp_header != b'u'
            and comp_sidedata[0:1] != b'\0'
            and len(comp_sidedata) < len(serialized_sidedata)
        )
        if use_compressed:
            assert not comp_header
            leading_byte = comp_sidedata[0:1]
            if leading_byte == self._docket.default_compression_header:
                sidedata_compression_mode = COMP_MODE_DEFAULT
            else:
                sidedata_compression_mode = COMP_MODE_INLINE
            serialized_sidedata = comp_sidedata
    else:
        sidedata_compression_mode = COMP_MODE_INLINE
        serialized_sidedata = b""
        # Don't store the offset if the sidedata is empty, that way
        # we can easily detect empty sidedata and they will be no different
        # than ones we manually add.
        sidedata_offset = 0

    rank = RANK_UNKNOWN
    if self.feature_config.compute_rank:
        has_p1 = p1r != nullrev
        has_p2 = p2r != nullrev
        if not has_p1 and not has_p2:
            rank = 1
        elif has_p1 and not has_p2:
            rank = 1 + self.fast_rank(p1r)
        elif has_p2 and not has_p1:
            rank = 1 + self.fast_rank(p2r)
        elif rustdagop is not None and self.index.rust_ext_compat:
            # merge node, rust implementation available
            rank = rustdagop.rank(self.index, p1r, p2r)
        else:
            # merge node, pure python computation
            pmin, pmax = sorted((p1r, p2r))
            rank = 1 + self.fast_rank(pmax)
            rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))

    index_entry = revlogutils.entry(
        flags=flags,
        data_offset=offset,
        data_compressed_length=deltainfo.deltalen,
        data_uncompressed_length=textlen,
        data_compression_mode=compression_mode,
        data_delta_base=deltainfo.base,
        link_rev=link,
        parent_rev_1=p1r,
        parent_rev_2=p2r,
        node_id=node,
        sidedata_offset=sidedata_offset,
        sidedata_compressed_length=len(serialized_sidedata),
        sidedata_compression_mode=sidedata_compression_mode,
        rank=rank,
    )

    self.index.append(index_entry)
    entry = self.index.entry_binary(curr)
    if curr == 0 and self._docket is None:
        # first entry of a docket-less revlog: prepend the packed
        # format header
        header = self.index.pack_header(
            self._format_flags | self._format_version
        )
        entry = header + entry
    self._writeentry(
        transaction,
        entry,
        deltainfo.data,
        link,
        offset,
        serialized_sidedata,
        sidedata_offset,
    )

    rawtext = btext[0]

    if alwayscache and rawtext is None:
        rawtext = deltacomputer.buildtext(revinfo)

    if type(rawtext) is bytes:  # only accept immutable objects
        self._inner._revisioncache = (node, curr, rawtext)
    self._chainbasecache[curr] = deltainfo.chainbase
    return curr

3270

3269

3271

def _get_data_offset(self, prev):
    """Return the current offset in the (in-transaction) data file.

    Versions < 2 of the revlog can get this in O(1); revlog v2 needs a
    docket file to store that information: since sidedata can be rewritten
    to the end of the data file within a transaction, you can have cases
    where, for example, rev `n` does not have sidedata while rev `n - 1`
    does, leading to `n - 1`'s sidedata being written after `n`'s data.

    Without a docket the result is ``self.end(prev)``; with one it is the
    docket's ``data_end``.

    TODO cache this in a docket file before getting out of experimental.
    """
    docket = self._docket
    if docket is not None:
        return docket.data_end
    return self.end(prev)

3284

3283

3285

def _writeentry(
    self,
    transaction,
    entry,
    data,
    link,
    offset,
    sidedata,
    sidedata_offset,
):
    """Write one index entry with its data and sidedata.

    The write is delegated to ``self._inner.write_entry``.  Afterwards the
    inline size limit is enforced, the docket (if any) is updated with the
    end offsets returned by the write, and the persistent nodemap is set
    up for the transaction.
    """
    # Files opened in a+ mode have inconsistent behavior on various
    # platforms. Windows requires that a file positioning call be made
    # when the file handle transitions between reads and writes. See
    # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
    # platforms, Python or the platform itself can be buggy. Some versions
    # of Solaris have been observed to not append at the end of the file
    # if the file was seeked to before the end. See issue4943 for more.
    #
    # The workaround is a seek() before writing; the known end offsets are
    # handed to the inner writer, presumably for that purpose (confirm in
    # ``write_entry``).
    # Note: This is likely not necessary on Python 3. However, because
    # the file handle is reused for reads and may be seeked there, we need
    # to be careful before changing this.
    if self._docket is None:
        index_end = data_end = sidedata_end = None
    else:
        index_end = self._docket.index_end
        data_end = self._docket.data_end
        sidedata_end = self._docket.sidedata_end

    written_ends = self._inner.write_entry(
        transaction,
        entry,
        data,
        link,
        offset,
        sidedata,
        sidedata_offset,
        index_end,
        data_end,
        sidedata_end,
    )
    self._enforceinlinesize(transaction)

    # self._docket is re-read on purpose: same access pattern as before
    if self._docket is not None:
        self._docket.index_end = written_ends[0]
        self._docket.data_end = written_ends[1]
        self._docket.sidedata_end = written_ends[2]

    nodemaputil.setup_persistent_nodemap(transaction, self)

3332

3331

3333

def addgroup(
    self,
    deltas,
    linkmapper,
    transaction,
    alwayscache=False,
    addrevisioncb=None,
    duplicaterevisioncb=None,
    debug_info=None,
    delta_base_reuse_policy=None,
):
    """Append a group of incoming deltas to this revlog.

    ``deltas`` is an iterable of 8-tuples
    ``(node, p1, p2, linknode, deltabase, delta, flags, sidedata)``.
    ``linkmapper`` is called with each ``linknode`` to obtain the link
    revision stored with the new entry.

    ``addrevisioncb``, when set, is called as ``cb(self, rev)`` after each
    revision is stored.  ``duplicaterevisioncb``, when set, is called the
    same way for every incoming node that is already present in the index.

    When ``delta_base_reuse_policy`` is None, it is derived from
    ``self.delta_config``: ``DELTA_BASE_REUSE_TRY`` if both
    ``general_delta`` and ``lazy_delta_base`` are enabled,
    ``DELTA_BASE_REUSE_NO`` otherwise.

    Returns True if at least one entry of ``deltas`` was processed
    (stored or recognised as a duplicate), False if ``deltas`` was empty.

    Raises ``error.ProgrammingError`` when called re-entrantly,
    ``error.LookupError`` when a parent or the delta base is unknown, and
    ``error.CensoredBaseError`` when the base is censored and the delta is
    not a single full-replacement patch.
    """
    if self._adding_group:
        raise error.ProgrammingError(b'cannot nest addgroup() calls')

    # fall back on the revlog configuration when the caller did not pick
    # a delta-base reuse policy for this group.
    if delta_base_reuse_policy is None:
        delta_cfg = self.delta_config
        if delta_cfg.general_delta and delta_cfg.lazy_delta_base:
            delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
        else:
            delta_base_reuse_policy = DELTA_BASE_REUSE_NO

    self._adding_group = True
    processed_any = False
    try:
        with self._writing(transaction):
            write_debug = (
                transaction._report
                if self.delta_config.debug_delta
                else None
            )
            deltacomputer = deltautil.deltacomputer(
                self,
                write_debug=write_debug,
                debug_info=debug_info,
            )
            for data in deltas:
                (
                    node,
                    p1,
                    p2,
                    linknode,
                    deltabase,
                    delta,
                    flags,
                    sidedata,
                ) = data
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                rev = self.index.get_rev(node)
                if rev is not None:
                    # already stored, e.g. two branches made the same
                    # change; only notify, do not store again.
                    self._nodeduplicatecallback(transaction, rev)
                    if duplicaterevisioncb:
                        duplicaterevisioncb(self, rev)
                    processed_any = True
                    continue

                for p in (p1, p2):
                    if not self.index.has_node(p):
                        raise error.LookupError(
                            p, self.radix, _(b'unknown parent')
                        )

                if not self.index.has_node(deltabase):
                    raise error.LookupError(
                        deltabase, self.display_id, _(b'unknown delta base')
                    )

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # a delta against a censored base is only acceptable
                    # when it replaces the whole base in one patch
                    # operation; compare its header with the expected one.
                    hlen = struct.calcsize(b">lll")
                    oldlen = self.rawsize(baserev)
                    newlen = len(delta) - hlen
                    expected_header = mdiff.replacediffheader(oldlen, newlen)
                    if delta[:hlen] != expected_header:
                        raise error.CensoredBaseError(
                            self.display_id, self.node(baserev)
                        )

                if not flags and self._peek_iscensored(baserev, delta):
                    flags |= REVIDX_ISCENSORED

                # The raw text is not provided (None): the revision is
                # described by its delta.  ``alwayscache`` is forwarded so
                # that callbacks reading the new revision can hit the
                # cache.
                rev = self._addrevision(
                    node,
                    None,
                    transaction,
                    link,
                    p1,
                    p2,
                    flags,
                    (baserev, delta, delta_base_reuse_policy),
                    alwayscache=alwayscache,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

                if addrevisioncb:
                    addrevisioncb(self, rev)
                processed_any = True
    finally:
        self._adding_group = False
    return processed_any

3460

3462

def iscensored(self, rev):
    """Tell whether revision ``rev`` carries the censored flag.

    Always False when the revlog is not censorable; otherwise the result
    of masking ``self.flags(rev)`` with ``REVIDX_ISCENSORED``.
    """
    if self.feature_config.censorable:
        return self.flags(rev) & REVIDX_ISCENSORED
    return False

3467

3469

def _peek_iscensored(self, baserev, delta):

3468

def _peek_iscensored(self, baserev, delta):

3470

"""Quickly check if a delta produces a censored revision."""

3469

"""Quickly check if a delta produces a censored revision."""

3471

if not self.feature_config.censorable:

3470

if not self.feature_config.censorable:

3472

return False

3471

return False

3473

3472

3474

return storageutil.deltaiscensored(delta, baserev, self.rawsize)

3473

return storageutil.deltaiscensored(delta, baserev, self.rawsize)

3475

3474

3476

def getstrippoint(self, minlink):
    """Compute where the revlog must be cut to strip linkrev ``minlink``.

    Returns a tuple: the minimum revision that must be stripped, and the
    set of all revisions whose linkrevs will be broken by that strip.
    """
    tiprev = len(self) - 1
    heads = self.headrevs()
    return storageutil.resolvestripinfo(
        minlink,
        tiprev,
        heads,
        self.linkrev,
        self.parentrevs,
    )

3488

3490

def strip(self, minlink, transaction):
    """Truncate the revlog at the first revision with linkrev >= minlink.

    Used when changelog revision ``minlink`` and its descendants are being
    stripped from the repository.  Every revision whose linkrev is
    >= minlink has to go, because the matching changelog revisions get
    renumbered after the strip.

    The revlog is cut at the first such revision; the caller is trusted to
    have saved any revision that must survive and to re-add it afterwards.
    """
    if not len(self):
        return

    # the second element (revisions with broken linkrevs) is not needed
    rev, _brokenrevs = self.getstrippoint(minlink)
    if rev == len(self):
        return

    # step 1: register the truncation points of the on-disk files
    data_end = self.start(rev)
    if self._inline:
        # inline revlogs keep index entries and data in the same file
        end = data_end + (rev * self.index.entry_size)
    else:
        transaction.add(self._datafile, data_end)
        end = rev * self.index.entry_size

    if self._sidedatafile:
        sidedata_end = self.sidedata_cut_off(rev)
        transaction.add(self._sidedatafile, sidedata_end)

    transaction.add(self._indexfile, end)
    if self._docket is not None:
        # XXX the docket could be leveraged while stripping, but it was
        # not powerful enough for that when this was written.
        self._docket.index_end = end
        self._docket.data_end = data_end
        self._docket.sidedata_end = sidedata_end
        self._docket.write(transaction, stripping=True)

    # step 2: drop the in-memory state about the stripped revisions
    self._chaininfocache = util.lrucachedict(500)
    self._inner.clear_cache()

    del self.index[rev:-1]

3536

3538

def checksize(self):
    """Compare the on-disk file sizes with what the index describes.

    Returns a ``(dd, di)`` tuple:

    - dd: extra bytes found in the "data" file
    - di: extra bytes found in the "index" file

    A healthy revlog returns ``(0, 0)``.  A missing file counts as zero
    extra bytes.
    """
    expected = 0
    if len(self):
        expected = max(0, self.end(len(self) - 1))

    try:
        with self._datafp() as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        dd = actual - expected
    except FileNotFoundError:
        dd = 0

    try:
        # use a context manager so the handle is released even when
        # seek()/tell() raises
        with self.opener(self._indexfile) as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        s = self.index.entry_size
        i = max(0, actual // s)
        di = actual - (i * s)
        if self._inline:
            # inline revlogs store the data in the index file: everything
            # beyond the entries and their data chunks is unexpected.
            databytes = sum(max(0, self.length(r)) for r in self)
            dd = 0
            di = actual - len(self) * s - databytes
    except FileNotFoundError:
        di = 0

    return (dd, di)

3576

3578

def files(self):
    """List the files that make up this revlog.

    The index file always comes first.  Without a docket, the data file
    follows unless the revlog is inline.  With a docket, the docket file
    and the older index/data/sidedata files it reports are listed, plus
    the current data and sidedata files when the docket records a
    non-zero end for them.
    """
    paths = [self._indexfile]
    if self._docket_file is not None:
        paths.append(self._docket_file)
        docket = self._docket
        paths.extend(docket.old_index_filepaths(include_empty=False))
        if docket.data_end:
            paths.append(self._datafile)
        paths.extend(docket.old_data_filepaths(include_empty=False))
        if docket.sidedata_end:
            paths.append(self._sidedatafile)
        paths.extend(docket.old_sidedata_filepaths(include_empty=False))
    elif not self._inline:
        paths.append(self._datafile)
    return paths

3593

3595

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
    sidedata_helpers=None,
    debug_info=None,
):
    """Emit revision deltas for ``nodes`` through ``storageutil``.

    ``nodesorder`` must be ``b'nodes'``, ``b'storage'``, ``b'linear'`` or
    None; anything else raises ``error.ProgrammingError``.  When it is
    None and the revlog does not use general delta, ``b'storage'`` is
    used.

    When the revlog does not store delta chains, ``deltamode`` is forced
    to ``CG_DELTAMODE_FULL`` unless it is ``CG_DELTAMODE_PREV``.

    Returns whatever ``storageutil.emitrevisions`` returns.
    """
    valid_orders = (b'nodes', b'storage', b'linear', None)
    if nodesorder not in valid_orders:
        raise error.ProgrammingError(
            b'unhandled value for nodesorder: %s' % nodesorder
        )

    if nodesorder is None and not self.delta_config.general_delta:
        nodesorder = b'storage'

    if not (
        self._storedeltachains
        or deltamode == repository.CG_DELTAMODE_PREV
    ):
        deltamode = repository.CG_DELTAMODE_FULL

    return storageutil.emitrevisions(
        self,
        nodes,
        nodesorder,
        revlogrevisiondelta,
        deltaparentfn=self.deltaparent,
        candeltafn=self._candelta,
        rawsizefn=self.rawsize,
        revdifffn=self.revdiff,
        flagsfn=self.flags,
        deltamode=deltamode,
        revisiondata=revisiondata,
        assumehaveparentrevisions=assumehaveparentrevisions,
        sidedata_helpers=sidedata_helpers,
        debug_info=debug_info,
    )

3634

3636

# Values accepted for the ``deltareuse`` argument of ``clone()``.
DELTAREUSEALWAYS = b'always'
DELTAREUSESAMEREVS = b'samerevs'
DELTAREUSENEVER = b'never'
DELTAREUSEFULLADD = b'fulladd'

# The complete set of valid policies, used to validate ``deltareuse``.
DELTAREUSEALL = {
    DELTAREUSEALWAYS,
    DELTAREUSESAMEREVS,
    DELTAREUSENEVER,
    DELTAREUSEFULLADD,
}

3642

3644

def clone(
    self,
    tr,
    destrevlog,
    addrevisioncb=None,
    deltareuse=DELTAREUSESAMEREVS,
    forcedeltabothparents=None,
    sidedata_helpers=None,
):
    """Copy every revision of this revlog into ``destrevlog``.

    The destination ends up with the same revisions and nodes, but may
    not be bit-for-bit identical (e.g. because deltas are encoded
    differently).  The destination must be empty, and neither revlog may
    have filtered revisions; ``ValueError`` is raised otherwise, as well
    as for an unknown ``deltareuse`` value.

    ``deltareuse`` selects how deltas of the source are carried over:

    DELTAREUSEALWAYS
      Reuse source deltas whenever possible, even when the destination
      would have picked other revisions to delta against.  Fastest mode.
    DELTAREUSESAMEREVS
      Reuse a source delta only when the destination would delta against
      the same revisions.  A balance between speed and optimization, and
      the default.  For instance, when converting a non-generaldelta
      revlog to generaldelta, deltas get recomputed if the delta's parent
      is not a parent of the revision.
    DELTAREUSENEVER
      Never reuse deltas.  Slowest mode; useful to recompute deltas
      (e.g. after a change of the diff/delta algorithm).
    DELTAREUSEFULLADD
      Re-add each revision as if it were new content.  Slower than
      DELTAREUSEALWAYS, but lets more mechanisms kick in, such as large
      file detection and handling.

    Computing deltas can be slow, so this choice can significantly affect
    run time.

    ``forcedeltabothparents`` controls whether deltas against both
    parents are computed for merges; when it is falsy the destination's
    current ``delta_both_parents`` setting is used.

    See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
    `sidedata_helpers`.

    The destination's ``delta_config`` is replaced by a modified copy for
    the duration of the clone and restored afterwards.
    """
    if deltareuse not in self.DELTAREUSEALL:
        raise ValueError(
            _(b'value for deltareuse invalid: %s') % deltareuse
        )

    if len(destrevlog):
        raise ValueError(_(b'destination revlog is not empty'))

    if getattr(self, 'filteredrevs', None):
        raise ValueError(_(b'source revlog has filtered revisions'))
    if getattr(destrevlog, 'filteredrevs', None):
        raise ValueError(_(b'destination revlog has filtered revisions'))

    # lazy_delta and lazy_delta_base control whether a cached delta is
    # reused when possible; tweak them on a private copy of the config.
    old_delta_config = destrevlog.delta_config
    destrevlog.delta_config = destrevlog.delta_config.copy()

    try:
        # policy -> (lazy_delta_base, lazy_delta); DELTAREUSEFULLADD
        # leaves both settings untouched.
        lazy_by_policy = {
            self.DELTAREUSEALWAYS: (True, True),
            self.DELTAREUSESAMEREVS: (False, True),
            self.DELTAREUSENEVER: (False, False),
        }
        lazy_settings = lazy_by_policy.get(deltareuse)
        if lazy_settings is not None:
            lazy_base, lazy = lazy_settings
            destrevlog.delta_config.lazy_delta_base = lazy_base
            destrevlog.delta_config.lazy_delta = lazy

        delta_both_parents = (
            forcedeltabothparents or old_delta_config.delta_both_parents
        )
        destrevlog.delta_config.delta_both_parents = delta_both_parents

        with self.reading(), destrevlog._writing(tr):
            self._clone(
                tr,
                destrevlog,
                addrevisioncb,
                deltareuse,
                forcedeltabothparents,
                sidedata_helpers,
            )

    finally:
        destrevlog.delta_config = old_delta_config

3742

3744

def _clone(
    self,
    tr,
    destrevlog,
    addrevisioncb,
    deltareuse,
    forcedeltabothparents,
    sidedata_helpers,
):
    """Do the actual copying for `revlog.clone`, arguments being validated

    Walks every revision of this revlog and stores it in ``destrevlog``,
    either through ``addrevision`` (DELTAREUSEFULLADD) or through
    ``_addrevision`` with an optional cached delta.  ``addrevisioncb``,
    when set, is called as ``cb(self, rev, node)`` after each revision.
    """
    write_debug = tr._report if self.delta_config.debug_delta else None
    deltacomputer = deltautil.deltacomputer(
        destrevlog,
        write_debug=write_debug,
    )
    src_index = self.index
    for rev in self:
        entry = src_index[rev]

        # Read the raw index entry: some classes override linkrev to take
        # filtered revisions into account.
        flags = entry[0] & 0xFFFF
        linkrev = entry[4]
        p1 = src_index[entry[5]][7]
        p2 = src_index[entry[6]][7]
        node = entry[7]

        # The source delta is (possibly) reused when the policy allows it
        # and the stored chunk is a delta.
        cachedelta = None
        rawtext = None
        if deltareuse == self.DELTAREUSEFULLADD:
            text = self._revisiondata(rev)
            sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                sidedata, new_flags = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # NOTE(review): `&` binds tighter than `|`, so the second
                # mask only filters new_flags[0]; it never clears bits
                # already present in `flags`.  Confirm this is intended.
                flags = flags | (new_flags[0] & ~new_flags[1])

            destrevlog.addrevision(
                text,
                tr,
                linkrev,
                p1,
                p2,
                cachedelta=cachedelta,
                node=node,
                flags=flags,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )
        else:
            if destrevlog.delta_config.lazy_delta:
                dp = self.deltaparent(rev)
                if dp != nullrev:
                    cachedelta = (dp, bytes(self._inner._chunk(rev)))

            sidedata = None
            if not cachedelta:
                # no reusable delta: the raw text has to be provided
                try:
                    rawtext = self._revisiondata(rev)
                except error.CensoredNodeError as censored:
                    assert flags & REVIDX_ISCENSORED
                    rawtext = censored.tombstone
                sidedata = self.sidedata(rev)
            if sidedata is None:
                sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                sidedata, new_flags = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # NOTE(review): same precedence remark as in the
                # DELTAREUSEFULLADD branch above.
                flags = flags | (new_flags[0] & ~new_flags[1])

            destrevlog._addrevision(
                node,
                rawtext,
                tr,
                linkrev,
                p1,
                p2,
                flags,
                cachedelta,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )

        if addrevisioncb:
            addrevisioncb(self, rev, node)

3836

3838

def censorrevision(self, tr, censor_nodes, tombstone=b''):
    """Censor ``censor_nodes`` using the rewriter matching the format.

    Version 0 revlogs cannot be censored and raise ``error.RevlogError``.
    Version 1 revlogs are handled by ``rewrite.v1_censor``; every other
    format version goes through ``rewrite.v2_censor``.
    """
    if self._format_version == REVLOGV0:
        raise error.RevlogError(
            _(b'cannot censor with version %d revlogs')
            % self._format_version
        )

    if self._format_version == REVLOGV1:
        censor = rewrite.v1_censor
    else:
        censor = rewrite.v2_censor
    censor(self, tr, censor_nodes, tombstone)

3847

3849

def verifyintegrity(self, state):
    """Check this revlog for storage problems.

    This is a generator: it yields one ``revlogproblem`` per issue found
    (size mismatch of the underlying files, unexpected format version,
    unreadable or censored revisions, raw size mismatch).

    ``state`` is a dict shared with the caller. This method reads
    ``expectedversion``, ``erroroncensored`` and the optional
    ``skipflags`` keys, and (re)initialises ``skipread`` and
    ``safe_renamed`` to empty sets before walking the revisions.
    """
    data_excess, index_excess = self.checksize()
    if data_excess:
        yield revlogproblem(
            error=_(b'data length off by %d bytes') % data_excess
        )
    if index_excess:
        yield revlogproblem(
            error=_(b'index contains %d extra bytes') % index_excess
        )

    version = self._format_version

    # The verifier tells us what version revlog we should be.
    if version != state[b'expectedversion']:
        yield revlogproblem(
            warning=_(b"warning: '%s' uses revlog format %d; expected %d")
            % (self.display_id, version, state[b'expectedversion'])
        )

    state[b'skipread'] = set()
    state[b'safe_renamed'] = set()

    for rev in self:
        node = self.node(rev)

        # Verify contents. 4 cases to care about:
        #
        #   common: the most common case
        #   rename: with a rename
        #   meta: file content starts with b'\1\n', the metadata
        #         header defined in filelog.py, but without a rename
        #   ext: content stored externally
        #
        # More formally, their differences are shown below:
        #
        #                       | common | rename | meta  | ext
        #  -------------------------------------------------------
        #   flags()             | 0      | 0      | 0     | not 0
        #   renamed()           | False  | True   | False | ?
        #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
        #
        # "rawtext" means the raw text stored in revlog data, which
        # could be retrieved by "rawdata(rev)". "text"
        # mentioned below is "revision(rev)".
        #
        # There are 3 different lengths stored physically:
        #  1. L1: rawsize, stored in revlog index
        #  2. L2: len(rawtext), stored in revlog data
        #  3. L3: len(text), stored in revlog data if flags==0, or
        #     possibly somewhere else if flags!=0
        #
        # L1 should be equal to L2. L3 could be different from them.
        # "text" may or may not affect commit hash depending on flag
        # processors (see flagutil.addflagprocessor).
        #
        #              | common  | rename | meta  | ext
        # -------------------------------------------------
        # rawsize()    | L1      | L1     | L1    | L1
        # size()       | L1      | L2-LM  | L1(*) | L1 (?)
        # len(rawtext) | L2      | L2     | L2    | L2
        # len(text)    | L2      | L2     | L2    | L3
        # len(read())  | L2      | L2-LM  | L2-LM | L3 (?)
        #
        # LM:  length of metadata, depending on rawtext
        # (*): not ideal, see comment in filelog.size
        # (?): could be "- len(meta)" if the resolved content has
        #      rename metadata
        #
        # Checks needed to be done:
        #  1. length check: L1 == L2, in all cases.
        #  2. hash check: depending on flag processor, we may need to
        #     use either "text" (external), or "rawtext" (in revlog).

        try:
            skipflags = state.get(b'skipflags', 0)
            if skipflags:
                # only keep the skip flags this revision actually carries
                skipflags &= self.flags(rev)

            _verify_revision(self, skipflags, state, node)

            # L1 (index) versus L2 (actual raw text), see table above
            indexed_size = self.rawsize(rev)
            unpacked_size = len(self.rawdata(node))

            if indexed_size != unpacked_size:
                yield revlogproblem(
                    error=_(b'unpacked size is %d, %d expected')
                    % (unpacked_size, indexed_size),
                    node=node,
                )

        except error.CensoredNodeError:
            if state[b'erroroncensored']:
                yield revlogproblem(
                    error=_(b'censored file data'), node=node
                )
                state[b'skipread'].add(node)
        except Exception as exc:
            yield revlogproblem(
                error=_(b'unpacking %s: %s')
                % (short(node), stringutil.forcebytestr(exc)),
                node=node,
            )
            state[b'skipread'].add(node)

3952

3954

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Return a dict describing this revlog's storage.

    Each boolean argument requests one bytes key in the result; keys
    that were not requested are absent.

    - ``exclusivefiles``: list of ``(opener, path)`` pairs, the index
      file plus the data file when the revlog is not inline.
    - ``sharedfiles``: always an empty list here.
    - ``revisionscount``: ``len(self)``.
    - ``trackedsize``: sum of ``rawsize(rev)`` over all revisions.
    - ``storedsize``: sum of the on-disk ``st_size`` of ``self.files()``.
    """
    d = {}

    if exclusivefiles:
        exclusive = [(self.opener, self._indexfile)]
        if not self._inline:
            exclusive.append((self.opener, self._datafile))
        d[b'exclusivefiles'] = exclusive

    if sharedfiles:
        d[b'sharedfiles'] = []

    if revisionscount:
        d[b'revisionscount'] = len(self)

    if trackedsize:
        # map() already iterates its argument; no explicit iter() needed
        d[b'trackedsize'] = sum(map(self.rawsize, self))

    if storedsize:
        d[b'storedsize'] = sum(
            self.opener.stat(path).st_size for path in self.files()
        )

    return d

3983

3985

def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
    """Compute and store sidedata for ``startrev``..``endrev`` (inclusive).

    Does nothing when the revlog has no sidedata support or when
    ``helpers[1]`` and ``helpers[2]`` are both empty (nothing to generate
    or remove). For every revision in the range the sidedata helpers are
    run with an empty starting sidedata, the result is serialized (and
    compressed when that is smaller), appended through the sidedata file
    handle, and the index entry is then rewritten in place.

    Raises ``error.Abort`` if a revision in the range already carries
    sidedata, because rewriting it would leave garbage in the revlog.
    """
    if not self.feature_config.has_side_data:
        return
    # revlog formats with sidedata support do not support inline
    assert not self._inline
    if not helpers[1] and not helpers[2]:
        # Nothing to generate or remove
        return

    new_entries = []
    # append the new sidedata
    with self._writing(transaction):
        ifh, dfh, sdfh = self._inner._writinghandles
        # NOTE(review): this seeks the *data* handle to the sidedata end
        # while the offset below is read from the *sidedata* handle;
        # kept as-is, confirm whether ``sdfh.seek`` was intended.
        dfh.seek(self._docket.sidedata_end, os.SEEK_SET)

        current_offset = sdfh.tell()
        for rev in range(startrev, endrev + 1):
            entry = self.index[rev]
            new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                store=self,
                sidedata_helpers=helpers,
                sidedata={},
                rev=rev,
            )

            serialized_sidedata = sidedatautil.serialize_sidedata(
                new_sidedata
            )

            sidedata_compression_mode = COMP_MODE_INLINE
            if serialized_sidedata and self.feature_config.has_side_data:
                sidedata_compression_mode = COMP_MODE_PLAIN
                h, comp_sidedata = self._inner.compress(serialized_sidedata)
                # Compare one-byte *slices*: on Python 3 indexing bytes
                # yields an int, which never equals a bytes object, so
                # ``comp_sidedata[0]`` made the NUL check always true and
                # the default-header check always false.
                if (
                    h != b'u'
                    and comp_sidedata[0:1] != b'\0'
                    and len(comp_sidedata) < len(serialized_sidedata)
                ):
                    assert not h
                    # assumes default_compression_header is a one-byte
                    # bytes value -- TODO confirm against the docket
                    if (
                        comp_sidedata[0:1]
                        == self._docket.default_compression_header
                    ):
                        sidedata_compression_mode = COMP_MODE_DEFAULT
                    else:
                        sidedata_compression_mode = COMP_MODE_INLINE
                    serialized_sidedata = comp_sidedata
            if entry[8] != 0 or entry[9] != 0:
                # rewriting entries that already have sidedata is not
                # supported yet, because it introduces garbage data in the
                # revlog.
                msg = b"rewriting existing sidedata is not supported yet"
                raise error.Abort(msg)

            # Apply (potential) flags to add and to remove after running
            # the sidedata helpers
            # NOTE(review): ``&`` binds tighter than ``|``, so the removal
            # mask only applies to the flags being added, not to the
            # existing ones; parenthesised to make that explicit without
            # changing the result. Confirm this is the intent.
            new_offset_flags = entry[0] | (flags[0] & ~flags[1])
            entry_update = (
                current_offset,
                len(serialized_sidedata),
                new_offset_flags,
                sidedata_compression_mode,
            )

            # the sidedata computation might have moved the file cursors
            # around
            sdfh.seek(current_offset, os.SEEK_SET)
            sdfh.write(serialized_sidedata)
            new_entries.append(entry_update)
            current_offset += len(serialized_sidedata)
            self._docket.sidedata_end = sdfh.tell()

        # rewrite the new index entries
        ifh.seek(startrev * self.index.entry_size)
        for i, e in enumerate(new_entries):
            rev = startrev + i
            self.index.replace_sidedata_info(rev, *e)
            packed = self.index.entry_binary(rev)
            if rev == 0 and self._docket is None:
                # without a docket the first entry also carries the
                # packed format header
                header = self._format_flags | self._format_version
                header = self.index.pack_header(header)
                packed = header + packed
            ifh.write(packed)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changelog.py - changelog class for mercurial
             #
             # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from .i18n import _
             from .node import (
                 bin,
                 hex,
             )
             from .thirdparty import attr
             from . import (
                 encoding,
                 error,
                 metadata,
                 pycompat,
                 revlog,
             )
             from .utils import (
                 dateutil,
                 stringutil,
             )
             from .revlogutils import (
                 constants as revlog_constants,
                 flagutil,
             )
             _defaultextra = {b'branch': b'default'}
             def _string_escape(text):
                 """
                 >>> from .pycompat import bytechr as chr
                 >>> d = {b'nl': chr(10), b'bs': chr(92), b'cr': chr(13), b'nul': chr(0)}
                 >>> s = b"ab%(nl)scd%(bs)s%(bs)sn%(nul)s12ab%(cr)scd%(bs)s%(nl)s" % d
                 >>> s
                 'ab\\ncd\\\\\\\\n\\x0012ab\\rcd\\\\\\n'
                 >>> res = _string_escape(s)
                 >>> s == _string_unescape(res)
                 True
                 """
                 # subset of the string_escape codec
                 text = (
                     text.replace(b'\\', b'\\\\')
                     .replace(b'\n', b'\\n')
                     .replace(b'\r', b'\\r')
                 )
                 return text.replace(b'\0', b'\\0')
             def _string_unescape(text):
                 """Undo ``_string_escape``, including its NUL escape sequence."""
                 if b'\\0' not in text:
                     return stringutil.unescapestr(text)
                 # fix up \0 without getting into trouble with \\0: a newline is
                 # temporarily inserted after every escaped backslash so that an
                 # escaped backslash followed by a literal "0" is not mistaken for
                 # an escaped NUL; the markers are removed again afterwards.
                 # NOTE(review): this assumes the escaped text holds no raw
                 # newline, which is the case for _string_escape output.
                 marked = text.replace(b'\\\\', b'\\\\\n')
                 with_nul = marked.replace(b'\\0', b'\0')
                 unmarked = with_nul.replace(b'\n', b'')
                 return stringutil.unescapestr(unmarked)
             def decodeextra(text):
                 """Parse an encoded extra field into a dict.

                 The result starts as a copy of ``_defaultextra`` and is updated
                 with every NUL-separated ``key:value`` item found in ``text``.

                 >>> from .pycompat import bytechr as chr
                 >>> sorted(decodeextra(encodeextra({b'foo': b'bar', b'baz': chr(0) + b'2'})
                 ...                    ).items())
                 [('baz', '\\x002'), ('branch', 'default'), ('foo', 'bar')]
                 >>> sorted(decodeextra(encodeextra({b'foo': b'bar',
                 ...                                 b'baz': chr(92) + chr(0) + b'2'})
                 ...                    ).items())
                 [('baz', '\\\\\\x002'), ('branch', 'default'), ('foo', 'bar')]
                 """
                 extra = _defaultextra.copy()
                 # empty chunks (e.g. from an empty text) carry no item
                 for item in filter(None, text.split(b'\0')):
                     key, value = _string_unescape(item).split(b':', 1)
                     extra[key] = value
                 return extra
             def encodeextra(d):
                 """Encode dict ``d`` as NUL-joined, escaped ``key:value`` items."""
                 # keys must be sorted to produce a deterministic changelog entry
                 return b"\0".join(
                     _string_escape(b'%s:%s' % (key, d[key])) for key in sorted(d)
                 )
             def stripdesc(desc):
                 """strip trailing whitespace and leading and trailing empty lines"""
                 trimmed_lines = (line.rstrip() for line in desc.splitlines())
                 return b'\n'.join(trimmed_lines).strip(b'\n')
             @attr.s
             class _changelogrevision:
                 """Plain attribute record with the same field names as the
                 properties of ``changelogrevision``.

                 ``changelogrevision.__new__`` returns an instance of this class,
                 built with only ``extra`` and ``manifest``, when the revision text
                 is empty; every other field then keeps the default given below.
                 """

                 # Extensions might modify _defaultextra, so let the constructor below pass
                 # it in
                 extra = attr.ib()
                 # required: no default is defined for the manifest node
                 manifest = attr.ib()
                 user = attr.ib(default=b'')
                 # (time, timezone) pair
                 date = attr.ib(default=(0, 0))
                 # Factory gives each instance its own list
                 files = attr.ib(default=attr.Factory(list))
                 filesadded = attr.ib(default=None)
                 filesremoved = attr.ib(default=None)
                 p1copies = attr.ib(default=None)
                 p2copies = attr.ib(default=None)
                 description = attr.ib(default=b'')
                 # (branch name, closed flag); evaluated once, at class creation
                 branchinfo = attr.ib(default=(_defaultextra[b'branch'], False))
             class changelogrevision:
                 """Lazy, read-only view over one parsed changelog entry.

                 A changelog entry bundles the manifest node, user, date, extra
                 metadata, touched files and description. Only the positions of
                 the separating newlines are computed up front; each property
                 slices and decodes its own part of the text on access.
                 """

                 __slots__ = (
                     '_offsets',
                     '_text',
                     '_sidedata',
                     '_cpsd',
                     '_changes',
                 )

                 def __new__(cls, cl, text, sidedata, cpsd):
                     if not text:
                         # nothing to parse: hand back a record of defaults
                         return _changelogrevision(extra=_defaultextra, manifest=cl.nullid)

                     # We could return the bare instance and implement the rest as
                     # an __init__. But doing it here is equivalent and saves an
                     # extra function call.

                     # format used:
                     # nodeid\n        : manifest node in ascii
                     # user\n          : user, no \n or \r allowed
                     # time tz extra\n : date (time is int or float, timezone is int)
                     #                 : extra is metadata, encoded and separated by '\0'
                     #                 : older versions ignore it
                     # files\n\n       : files modified by the cset, no \n or \r allowed
                     # (.*)            : comment (free text, ideally utf-8)
                     #
                     # changelog v0 doesn't use extra
                     manifest_end = text.index(b'\n')
                     user_end = text.index(b'\n', manifest_end + 1)
                     date_end = text.index(b'\n', user_end + 1)

                     # The list of files may be empty. Which means date_end is the
                     # first of the double newline that precedes the description.
                     if text[date_end + 1 : date_end + 2] == b'\n':
                         files_end = date_end
                     else:
                         files_end = text.index(b'\n\n', date_end + 1)

                     self = super().__new__(cls)
                     self._offsets = (manifest_end, user_end, date_end, files_end)
                     self._text = text
                     self._sidedata = sidedata
                     self._cpsd = cpsd
                     self._changes = None
                     return self

                 def _dateextra_fields(self):
                     """Split the "time tz extra" line into at most three fields."""
                     _manifest_end, user_end, date_end, _files_end = self._offsets
                     return self._text[user_end + 1 : date_end].split(b' ', 2)

                 @property
                 def manifest(self):
                     """Binary manifest node, decoded from the first line."""
                     return bin(self._text[: self._offsets[0]])

                 @property
                 def user(self):
                     """User name (second line), converted to the local encoding."""
                     manifest_end, user_end = self._offsets[:2]
                     return encoding.tolocal(self._text[manifest_end + 1 : user_end])

                 @property
                 def _rawdate(self):
                     """Undecoded time and timezone fields, as a list."""
                     return self._dateextra_fields()[0:2]

                 @property
                 def _rawextra(self):
                     """Undecoded extra blob, or None when the entry has none."""
                     fields = self._dateextra_fields()
                     return fields[2] if len(fields) == 3 else None

                 @property
                 def date(self):
                     """``(time, timezone)`` with time as float and timezone as int."""
                     raw = self._rawdate
                     time = float(raw[0])
                     # Various tools did silly things with the timezone.
                     try:
                         timezone = int(raw[1])
                     except ValueError:
                         timezone = 0
                     return time, timezone

                 @property
                 def extra(self):
                     """Decoded extra dict; ``_defaultextra`` itself when absent."""
                     raw = self._rawextra
                     return _defaultextra if raw is None else decodeextra(raw)

                 @property
                 def changes(self):
                     """File-change summary, computed on first access and cached."""
                     cached = self._changes
                     if cached is None:
                         if self._cpsd:
                             cached = metadata.decode_files_sidedata(self._sidedata)
                         else:
                             cached = metadata.ChangingFiles(
                                 touched=self.files or (),
                                 added=self.filesadded or (),
                                 removed=self.filesremoved or (),
                                 p1_copies=self.p1copies or {},
                                 p2_copies=self.p2copies or {},
                             )
                         self._changes = cached
                     return cached

                 @property
                 def files(self):
                     """List of touched files (sorted sidedata set, or text lines)."""
                     if self._cpsd:
                         return sorted(self.changes.touched)
                     date_end, files_end = self._offsets[2:]
                     if date_end == files_end:
                         # the file list is empty
                         return []
                     return self._text[date_end + 1 : files_end].split(b'\n')

                 @property
                 def filesadded(self):
                     """Added files, or None when the extra dict has no such key."""
                     if self._cpsd:
                         return self.changes.added
                     rawindices = self.extra.get(b'filesadded')
                     if rawindices is None:
                         return None
                     return metadata.decodefileindices(self.files, rawindices)

                 @property
                 def filesremoved(self):
                     """Removed files, or None when the extra dict has no such key."""
                     if self._cpsd:
                         return self.changes.removed
                     rawindices = self.extra.get(b'filesremoved')
                     if rawindices is None:
                         return None
                     return metadata.decodefileindices(self.files, rawindices)

                 @property
                 def p1copies(self):
                     """Copies from p1, or None when the extra dict has no such key."""
                     if self._cpsd:
                         return self.changes.copied_from_p1
                     rawcopies = self.extra.get(b'p1copies')
                     if rawcopies is None:
                         return None
                     return metadata.decodecopies(self.files, rawcopies)

                 @property
                 def p2copies(self):
                     """Copies from p2, or None when the extra dict has no such key."""
                     if self._cpsd:
                         return self.changes.copied_from_p2
                     rawcopies = self.extra.get(b'p2copies')
                     if rawcopies is None:
                         return None
                     return metadata.decodecopies(self.files, rawcopies)

                 @property
                 def description(self):
                     """Everything after the double newline, in the local encoding."""
                     body_start = self._offsets[3] + 2
                     return encoding.tolocal(self._text[body_start:])

                 @property
                 def branchinfo(self):
                     """``(branch name, closed)`` derived from the extra dict."""
                     extra = self.extra
                     branch = encoding.tolocal(extra.get(b"branch"))
                     closed = b'close' in extra
                     return branch, closed
             class changelog(revlog.revlog):
                 def __init__(self, opener, trypending=False, concurrencychecker=None):
                     """Load a changelog revlog using an opener.

                     If ``trypending`` is true, we attempt to load the index from a
                     ``00changelog.i.a`` file instead of the default ``00changelog.i``.
                     The ``00changelog.i.a`` file contains index (and possibly inline
                     revision) data for a transaction that hasn't been finalized yet.
                     It exists in a separate file to facilitate readers (such as
                     hooks processes) accessing data before a transaction is finalized.

                     ``concurrencychecker`` will be passed to the revlog init function, see
                     the documentation there.
                     """
                     # The persistent nodemap is opt-in through the opener options.
                     revlog.revlog.__init__(
                         self,
                         opener,
                         target=(revlog_constants.KIND_CHANGELOG, None),
                         radix=b'00changelog',
                         checkambig=True,
                         mmaplargeindex=True,
                         persistentnodemap=opener.options.get(b'persistent-nodemap', False),
                         concurrencychecker=concurrencychecker,
                         trypending=trypending,
                         may_inline=False,
                     )
                     if self._initempty and (self._format_version == revlog.REVLOGV1):
                         # changelogs don't benefit from generaldelta.
                         self._format_flags &= ~revlog.FLAG_GENERALDELTA
                         self.delta_config.general_delta = False
                     # Delta chains for changelogs tend to be very small because entries
                     # tend to be small and don't delta well with each other. So disable
                     # delta chains.
                     self._storedeltachains = False
                     # True while docket writes are being held back (see delayupdate)
                     self._v2_delayed = False
                     # filtered revisions and a cache that is reset whenever they change
                     self._filteredrevs = frozenset()
                     self._filteredrevs_hashcache = {}
                     # compared against b'changeset-sidedata' in read()
                     self._copiesstorage = opener.options.get(b'copies-storage')
                 @property
                 def filteredrevs(self):
                     """The frozenset of filtered revisions currently in effect."""
                     return self._filteredrevs
                 @filteredrevs.setter
                 def filteredrevs(self, val):
                     """Replace the filtered set and reset the associated hash cache.

                     ``val`` must be a ``frozenset``; this is enforced by an assert.
                     """
                     # Ensure all updates go through this function
                     assert isinstance(val, frozenset)
                     self._filteredrevs = val
                     # drop the cache that belonged to the previous filtered set
                     self._filteredrevs_hashcache = {}
                 def _write_docket(self, tr):
                     """Write the docket through the parent class unless delayed."""
                     if self._v2_delayed:
                         # docket writes are held back while updates are delayed
                         return
                     super(changelog, self)._write_docket(tr)
                 def delayupdate(self, tr):
                     """delay visibility of index updates to other readers

                     Registers ``_writepending`` and ``_finalize`` on the
                     transaction ``tr`` under a key derived from ``id(self)``.
                     """
                     assert not self._inner.is_open
                     assert not self._may_inline
                     # enforce that older changelog that are still inline are split at the
                     # first opportunity.
                     if self._inline:
                         self._enforceinlinesize(tr)
                     if self._docket is None:
                         pending_index = self._inner.delay()
                         if pending_index is not None:
                             self._indexfile = pending_index
                             tr.registertmp(pending_index)
                     else:
                         # with a docket, only the docket write is held back
                         self._v2_delayed = True
                     callback_key = b'cl-%i' % id(self)
                     tr.addpending(callback_key, self._writepending)
                     tr.addfinalize(callback_key, self._finalize)
                 def _finalize(self, tr):
                     """finalize index updates

                     Raises ``error.ProgrammingError`` if, without a docket, the
                     changelog is still inline once the pending index is finalized.
                     """
                     assert not self._inner.is_open
                     if self._docket is not None:
                         self._docket.write(tr)
                         self._v2_delayed = False
                         return
                     self._indexfile = self._inner.finalize_pending()
                     if self._inline:
                         msg = 'changelog should not be inline at that point'
                         raise error.ProgrammingError(msg)
                 def _writepending(self, tr):
                     """create a file containing the unfinalized state for
                     pretxnchangegroup

                     Returns the "any pending" value reported by the docket or by
                     the inner revlog, whichever performed the write.
                     """
                     assert not self._inner.is_open
                     if not self._docket:
                         pending_index, any_pending = self._inner.write_pending()
                         if pending_index is not None:
                             self._indexfile = pending_index
                             tr.registertmp(pending_index)
                         return any_pending
                     any_pending = self._docket.write(tr, pending=True)
                     self._v2_delayed = False
                     return any_pending
-                def _enforceinlinesize(self, tr, side_write=True):
+                def _enforceinlinesize(self, tr):
                     # NOTE(review): the lines prefixed with "-"/"+" are two sides of
                     # an unresolved diff hunk; confirm which signature is intended.
                     #
                     # Inline-size enforcement is skipped while the changelog is
                     # delaying; otherwise it is delegated to the revlog base class.
                     if not self.is_delaying:
-                        revlog.revlog._enforceinlinesize(self, tr, side_write=side_write)
+                        revlog.revlog._enforceinlinesize(self, tr)
                 def read(self, nodeorrev):
                     """Return the parsed fields of a changelog revision as a 6-tuple.

                     The tuple holds, in order:
                        - the manifest node in binary
                        - the author/user as a localstr
                        - the date as a 2-tuple of (time, timezone)
                        - the list of files
                        - the commit message as a localstr
                        - the dict of extra metadata

                     When only some of the fields are needed, prefer
                     ``changelogrevision``: it is faster for partial object access.
                     """
                     text = self._revisiondata(nodeorrev)
                     sidedata = self.sidedata(nodeorrev)
                     has_copy_sidedata = self._copiesstorage == b'changeset-sidedata'
                     parsed = changelogrevision(self, text, sidedata, has_copy_sidedata)
                     return (
                         parsed.manifest,
                         parsed.user,
                         parsed.date,
                         parsed.files,
                         parsed.description,
                         parsed.extra,
                     )
                 def changelogrevision(self, nodeorrev):
                     """Build a ``changelogrevision`` object for a node or revision."""
                     text = self._revisiondata(nodeorrev)
                     sidedata = self.sidedata(nodeorrev)
                     has_copy_sidedata = self._copiesstorage == b'changeset-sidedata'
                     return changelogrevision(self, text, sidedata, has_copy_sidedata)
                 def readfiles(self, nodeorrev):
                     """Return only the list of files modified by the changeset.

                     This is a short version of ``read``: an empty revision text gives
                     an empty list.
                     """
                     text = self.revision(nodeorrev)
                     if not text:
                         return []
                     header_end = text.index(b"\n\n")
                     header_lines = text[:header_end].split(b'\n')
                     # The first three header lines are not file names.
                     return header_lines[3:]
                 def add(
                     self,
                     manifest,
                     files,
                     desc,
                     transaction,
                     p1,
                     p2,
                     user,
                     date=None,
                     extra=None,
                 ):
                     """Build a changeset text and store it as a new revision.

                     The text is the "\\n"-join of: the hex manifest node, the user,
                     the date line (followed by the encoded ``extra`` when there is
                     any), the sorted touched files, an empty line and the stripped
                     description.

                     ``files`` must expose ``touched``; ``has_copies_info`` is also
                     read when copies are stored in changeset sidedata.  When ``date``
                     is falsy, ``dateutil.makedate()`` provides the date.

                     NOTE: the ``extra`` dict passed by the caller is modified in place
                     when its ``b"branch"`` entry is ``b"default"`` or ``b""``.

                     Returns the node of the revision that was added.

                     Raises ``error.StorageError`` for an empty username, a username
                     containing a newline, or a reserved branch name.
                     """
                     # Convert to UTF-8 encoded bytestrings as the very first
                     # thing: calling any method on a localstr object will turn it
                     # into a str object and the cached UTF-8 string is thus lost.
                     user, desc = encoding.fromlocal(user), encoding.fromlocal(desc)
                     user = user.strip()
                     # An empty username or a username with a "\n" will make the
                     # revision text contain two "\n\n" sequences -> corrupt
                     # repository since read cannot unpack the revision.
                     if not user:
                         raise error.StorageError(_(b"empty username"))
                     if b"\n" in user:
                         raise error.StorageError(
                             _(b"username %r contains a newline") % pycompat.bytestr(user)
                         )
                     desc = stripdesc(desc)
                     if date:
                         parseddate = b"%d %d" % dateutil.parsedate(date)
                     else:
                         parseddate = b"%d %d" % dateutil.makedate()
                     if extra:
                         branch = extra.get(b"branch")
                         # The default branch is implicit, so it is not recorded.
                         if branch in (b"default", b""):
                             del extra[b"branch"]
                         elif branch in (b".", b"null", b"tip"):
                             raise error.StorageError(
                                 _(b'the name \'%s\' is reserved') % branch
                             )
                     sortedfiles = sorted(files.touched)
                     flags = 0
                     sidedata = None
                     # Sidedata is only produced when copies live in changeset sidedata.
                     if self._copiesstorage == b'changeset-sidedata':
                         if files.has_copies_info:
                             flags |= flagutil.REVIDX_HASCOPIESINFO
                         sidedata = metadata.encode_files_sidedata(files)
                     # ``extra`` may have become empty after the branch removal above,
                     # hence the second truthiness check.
                     if extra:
                         extra = encodeextra(extra)
                         parseddate = b"%s %s" % (parseddate, extra)
                     l = [hex(manifest), user, parseddate] + sortedfiles + [b"", desc]
                     text = b"\n".join(l)
                     rev = self.addrevision(
                         text, transaction, len(self), p1, p2, sidedata=sidedata, flags=flags
                     )
                     return self.node(rev)
                 def branchinfo(self, rev):
                     """Return the branch name and open/close state of a revision.

                     This shortcut exists because creating a changectx object just to
                     read this information is costly.
                     """
                     revision_data = self.changelogrevision(rev)
                     return revision_data.branchinfo
                 def _nodeduplicatecallback(self, transaction, rev):
                     # Keep track of revisions that got "re-added", e.g. the unbundle
                     # of a known rev.
                     #
                     # A list is used so that the order from the source bundle is
                     # preserved.
                     transaction.changes.setdefault(b'revduplicates', []).append(rev)

             # revlog.py - storage back-end for mercurial
             # coding: utf8
             #
             # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Storage back-end for Mercurial.
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches.
             """
             import binascii
             import collections
             import contextlib
             import functools
             import io
             import os
             import struct
             import weakref
             import zlib
             # import stuff from node for others to import from revlog
             from .node import (
                 bin,
                 hex,
                 nullrev,
                 sha1nodeconstants,
                 short,
                 wdirrev,
             )
             from .i18n import _
             from .revlogutils.constants import (
                 ALL_KINDS,
                 CHANGELOGV2,
                 COMP_MODE_DEFAULT,
                 COMP_MODE_INLINE,
                 COMP_MODE_PLAIN,
                 DELTA_BASE_REUSE_NO,
                 DELTA_BASE_REUSE_TRY,
                 ENTRY_RANK,
                 FEATURES_BY_VERSION,
                 FLAG_GENERALDELTA,
                 FLAG_INLINE_DATA,
                 INDEX_HEADER,
                 KIND_CHANGELOG,
                 KIND_FILELOG,
                 RANK_UNKNOWN,
                 REVLOGV0,
                 REVLOGV1,
                 REVLOGV1_FLAGS,
                 REVLOGV2,
                 REVLOGV2_FLAGS,
                 REVLOG_DEFAULT_FLAGS,
                 REVLOG_DEFAULT_FORMAT,
                 REVLOG_DEFAULT_VERSION,
                 SUPPORTED_FLAGS,
             )
             from .revlogutils.flagutil import (
                 REVIDX_DEFAULT_FLAGS,
                 REVIDX_ELLIPSIS,
                 REVIDX_EXTSTORED,
                 REVIDX_FLAGS_ORDER,
                 REVIDX_HASCOPIESINFO,
                 REVIDX_ISCENSORED,
                 REVIDX_RAWTEXT_CHANGING_FLAGS,
             )
             from .thirdparty import attr
             from . import (
                 ancestor,
                 dagop,
                 error,
                 mdiff,
                 policy,
                 pycompat,
                 revlogutils,
                 templatefilters,
                 util,
             )
             from .interfaces import (
                 repository,
                 util as interfaceutil,
             )
             from .revlogutils import (
                 deltas as deltautil,
                 docket as docketutil,
                 flagutil,
                 nodemap as nodemaputil,
                 randomaccessfile,
                 revlogv0,
                 rewrite,
                 sidedata as sidedatautil,
             )
             from .utils import (
                 storageutil,
                 stringutil,
             )
             # Blanket usage of all the names below to silence pyflakes complaints.
             # We need these names available in the module for extensions.
             REVLOGV0
             REVLOGV1
             REVLOGV2
             CHANGELOGV2
             FLAG_INLINE_DATA
             FLAG_GENERALDELTA
             REVLOG_DEFAULT_FLAGS
             REVLOG_DEFAULT_FORMAT
             REVLOG_DEFAULT_VERSION
             REVLOGV1_FLAGS
             REVLOGV2_FLAGS
             REVIDX_ISCENSORED
             REVIDX_ELLIPSIS
             REVIDX_HASCOPIESINFO
             REVIDX_EXTSTORED
             REVIDX_DEFAULT_FLAGS
             REVIDX_FLAGS_ORDER
             REVIDX_RAWTEXT_CHANGING_FLAGS
             # Implementation modules looked up through ``policy``.
             # NOTE(review): ``rustrevlog`` is tested against None further down, so
             # ``importrust`` presumably returns None when Rust is unavailable.
             parsers = policy.importmod('parsers')
             rustancestor = policy.importrust('ancestor')
             rustdagop = policy.importrust('dagop')
             rustrevlog = policy.importrust('revlog')
             # Aliased for performance.
             _zlibdecompress = zlib.decompress
             # max size of inline data embedded into a revlog (131072 = 128 KiB)
             _maxinline = 131072
             # Flag processors for REVIDX_ELLIPSIS.
             def ellipsisreadprocessor(rl, text):
                 """Read-side flag processor: hand ``text`` back untouched.

                 The second element of the result is always False.
                 """
                 unchanged = text
                 return (unchanged, False)
             def ellipsiswriteprocessor(rl, text):
                 """Write-side flag processor: hand ``text`` back untouched.

                 The second element of the result is always False.
                 """
                 unchanged = text
                 return (unchanged, False)
             def ellipsisrawprocessor(rl, text):
                 """Raw flag processor: always answer False, whatever ``text`` is."""
                 answer = False
                 return answer
             # Processor triple for REVIDX_ELLIPSIS, ordered as (read, write, raw).
             ellipsisprocessor = (
                 ellipsisreadprocessor,
                 ellipsiswriteprocessor,
                 ellipsisrawprocessor,
             )
             def _verify_revision(rl, skipflags, state, node):
                 """Check the integrity of ``node`` in the revlog ``rl``.

                 This is a hook point that lets extensions influence verification.
                 When ``skipflags`` is truthy the node is only recorded in
                 ``state[b'skipread']``; otherwise the revision is read.
                 """
                 if not skipflags:
                     # Reading has the side effect of verifying the hash.
                     rl.revision(node)
                     return
                 state[b'skipread'].add(node)
             # True if a fast implementation for persistent-nodemap is available
             #
             # We also consider that we have a "fast" implementation in "pure" Python,
             # because people using pure don't really have performance considerations
             # (and have a wheelbarrow of other sources of slowness).
             HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
                 parsers, 'BaseIndexObject'
             )
             # Slotted attrs record declared as implementing
             # ``repository.irevisiondelta``.  The order of the fields below is the
             # order of the generated constructor arguments; only ``linknode`` has a
             # default.
             @interfaceutil.implementer(repository.irevisiondelta)
             @attr.s(slots=True)
             class revlogrevisiondelta:
                 node = attr.ib()
                 p1node = attr.ib()
                 p2node = attr.ib()
                 basenode = attr.ib()
                 flags = attr.ib()
                 baserevisionsize = attr.ib()
                 revision = attr.ib()
                 delta = attr.ib()
                 sidedata = attr.ib()
                 protocol_flags = attr.ib()
                 linknode = attr.ib(default=None)
             # Frozen attrs record declared as implementing
             # ``repository.iverifyproblem``.  Every field is optional and defaults
             # to None.
             @interfaceutil.implementer(repository.iverifyproblem)
             @attr.s(frozen=True)
             class revlogproblem:
                 warning = attr.ib(default=None)
                 error = attr.ib(default=None)
                 node = attr.ib(default=None)
             def parse_index_v1(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2``.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # Delegate to the C implementation to parse the index data.
                 parsed_index, chunk_cache = parsers.parse_index2(data, inline)
                 return parsed_index, chunk_cache
             def parse_index_v2(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2`` using the
                 ``REVLOGV2`` format.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # Delegate to the C implementation to parse the index data.
                 parsed_index, chunk_cache = parsers.parse_index2(
                     data, inline, format=REVLOGV2
                 )
                 return parsed_index, chunk_cache
             def parse_index_cl_v2(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2`` using the
                 ``CHANGELOGV2`` format.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # Delegate to the C implementation to parse the index data.
                 parsed_index, chunk_cache = parsers.parse_index2(
                     data, inline, format=CHANGELOGV2
                 )
                 return parsed_index, chunk_cache
             parse_index_v1_nodemap = None
             # The real parser only exists when ``parsers`` exposes the devel nodemap
             # entry point; otherwise the name stays bound to None.
             if hasattr(parsers, 'parse_index_devel_nodemap'):

                 def parse_index_v1_nodemap(data, inline):
                     """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``
                     and return the resulting ``(index, cache)`` pair."""
                     nodemap_index, chunk_cache = parsers.parse_index_devel_nodemap(
                         data, inline
                     )
                     return nodemap_index, chunk_cache
             def parse_index_v1_rust(data, inline, default_header):
                 """Build a ``rustrevlog.Index`` from ``data`` and ``default_header``.

                 Returns ``(index, cache)`` where ``cache`` is ``(0, data)`` for an
                 inline revlog and None otherwise.
                 """
                 if inline:
                     chunk_cache = (0, data)
                 else:
                     chunk_cache = None
                 rust_index = rustrevlog.Index(data, default_header)
                 return rust_index, chunk_cache
             # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
             # signed integer)
             _maxentrysize = 0x7FFFFFFF
             # Error message template; its placeholders are, in order: the revlog
             # name (%s), the expected byte count, the offset and the data size (%d).
             FILE_TOO_SHORT_MSG = _(
                 b'cannot read from revlog %s;'
                 b'  expected %d bytes from offset %d, data size is %d'
             )
             # Every hexadecimal digit, in lower and upper case.
             hexdigits = b'0123456789abcdefABCDEF'
             class _Config:
                 """Base class of the configuration holders; provides ``copy``."""

                 def copy(self):
                     """Return a new instance of the same class, built by passing the
                     current instance attributes as keyword arguments."""
                     attributes = vars(self)
                     return self.__class__(**attributes)
             @attr.s()
             class FeatureConfig(_Config):
                 """Hold configuration values about the available revlog features"""
                 # the default compression engine
                 compression_engine = attr.ib(default=b'zlib')
                 # compression engines options (a fresh dict for every instance)
                 compression_engine_options = attr.ib(default=attr.Factory(dict))
                 # can we use censor on this revlog
                 censorable = attr.ib(default=False)
                 # does this revlog use the "side data" feature
                 has_side_data = attr.ib(default=False)
                 # might remove rank configuration once the computation has no impact
                 compute_rank = attr.ib(default=False)
                 # parent order is supposed to be semantically irrelevant, so we
                 # normally resort parents to ensure that the first parent is non-null,
                 # if there is a non-null parent at all.
                 # filelog abuses the parent order as flag to mark some instances of
                 # meta-encoded files, so allow it to disable this behavior.
                 canonical_parent_order = attr.ib(default=False)
                 # can ellipsis commit be used
                 enable_ellipsis = attr.ib(default=False)
                 def copy(self):
                     """Return a copy that owns its own options dict.

                     The base ``copy`` would share ``compression_engine_options``
                     with the original, so the dict is copied explicitly.
                     """
                     new = super().copy()
                     new.compression_engine_options = self.compression_engine_options.copy()
                     return new
             @attr.s()
             class DataConfig(_Config):
                 """Hold configuration values about how the revlog data are read"""
                 # should we try to open the "pending" version of the revlog
                 try_pending = attr.ib(default=False)
                 # should we try to open the "split" version of the revlog
                 try_split = attr.ib(default=False)
                 # When True, indexfile should be opened with checkambig=True at
                 # writing, to avoid file stat ambiguity.
                 check_ambig = attr.ib(default=False)
                 # If true, use mmap instead of reading to deal with large index
                 mmap_large_index = attr.ib(default=False)
                 # how much data is large
                 mmap_index_threshold = attr.ib(default=None)
                 # How much data to read and cache into the raw revlog data cache.
                 chunk_cache_size = attr.ib(default=65536)
                 # The size of the uncompressed cache compared to the largest revision
                 # seen.
                 uncompressed_cache_factor = attr.ib(default=None)
                 # The number of chunks cached
                 uncompressed_cache_count = attr.ib(default=None)
                 # Allow sparse reading of the revlog data
                 with_sparse_read = attr.ib(default=False)
                 # minimal density of a sparse read chunk
                 sr_density_threshold = attr.ib(default=0.50)
                 # minimal size of data we skip when performing sparse read
                 sr_min_gap_size = attr.ib(default=262144)
                 # are deltas encoded against arbitrary bases.
                 generaldelta = attr.ib(default=False)
             @attr.s()
             class DeltaConfig(_Config):
                 """Hold configuration values about how new deltas are computed

                 Some attributes are duplicated from DataConfig to help having each
                 object self-contained.
                 """
                 # can delta be encoded against arbitrary bases.
                 general_delta = attr.ib(default=False)
                 # Allow sparse writing of the revlog data
                 sparse_revlog = attr.ib(default=False)
                 # maximum length of a delta chain
                 max_chain_len = attr.ib(default=None)
                 # Maximum distance between delta chain base start and end
                 max_deltachain_span = attr.ib(default=-1)
                 # If `upper_bound_comp` is not None, this is the expected maximal gain from
                 # compression for the data content.
                 upper_bound_comp = attr.ib(default=None)
                 # Should we try a delta against both parents
                 delta_both_parents = attr.ib(default=True)
                 # Test delta base candidate groups by chunks of this maximal size.
                 candidate_group_chunk_size = attr.ib(default=0)
                 # Should we display debug information about delta computation
                 debug_delta = attr.ib(default=False)
                 # trust incoming delta by default
                 lazy_delta = attr.ib(default=True)
                 # trust the base of incoming delta by default
                 lazy_delta_base = attr.ib(default=False)
             class _InnerRevlog:
                 """An inner layer of the revlog object
                 That layer exist to be able to delegate some operation to Rust, its
                 boundaries are arbitrary and based on what we can delegate to Rust.
                 """
                 def __init__(
                     self,
                     opener,
                     index,
                     index_file,
                     data_file,
                     sidedata_file,
                     inline,
                     data_config,
                     delta_config,
                     feature_config,
                     chunk_cache,
                     default_compression_header,
                 ):
                     """Store the collaborators and set up the caches.

                     Every argument is kept as an attribute.  Two random-access
                     file wrappers are created: one for the revision data and one
                     for the sidedata file.  ``chunk_cache`` is only handed to the
                     data wrapper.
                     """
                     self.opener = opener
                     self.index = index
                     self.index_file = index_file
                     self.data_file = data_file
                     self.sidedata_file = sidedata_file
                     self.inline = inline
                     self.data_config = data_config
                     self.delta_config = delta_config
                     self.feature_config = feature_config
                     # used during diverted write.
                     self._orig_index_file = None
                     self._default_compression_header = default_compression_header
                     # index
                     # 3-tuple of file handles being used for active writing.
                     self._writinghandles = None
                     # For an inline revlog the revision data is read from the index
                     # file, otherwise from the dedicated data file.
                     self._segmentfile = randomaccessfile.randomaccessfile(
                         self.opener,
                         (self.index_file if self.inline else self.data_file),
                         self.data_config.chunk_cache_size,
                         chunk_cache,
                     )
                     self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
                         self.opener,
                         self.sidedata_file,
                         self.data_config.chunk_cache_size,
                     )
                     # revlog header -> revlog compressor
                     self._decompressors = {}
                     # 3-tuple of (node, rev, text) for a raw revision.
                     self._revisioncache = None
                     # cache some uncompressed chunks
                     # rev → uncompressed_chunk
                     #
                     # the max cost is dynamically updated to be proportional to the
                     # size of revision we actually encounter.
                     #
                     # The cache only exists when a cache factor is configured.
                     self._uncompressed_chunk_cache = None
                     if self.data_config.uncompressed_cache_factor is not None:
                         self._uncompressed_chunk_cache = util.lrucachedict(
                             self.data_config.uncompressed_cache_count,
                             maxcost=65536,  # some arbitrary initial value
                         )
                     # A non-None value marks the revlog as delaying (see
                     # ``is_delaying``).
                     self._delay_buffer = None
                 def __len__(self):
                     """Number of entries in the index."""
                     index = self.index
                     return len(index)
                 def clear_cache(self):
                     """Drop the cached revision, the uncompressed chunks and the
                     caches of both segment files.

                     Must not be called while the revlog is delaying.
                     """
                     assert not self.is_delaying
                     self._revisioncache = None
                     chunk_cache = self._uncompressed_chunk_cache
                     if chunk_cache is not None:
                         chunk_cache.clear()
                     self._segmentfile.clear_cache()
                     self._segmentfile_sidedata.clear_cache()
                 @property
                 def canonical_index_file(self):
                     """The original index file when one was recorded for a diverted
                     write, the current index file otherwise."""
                     diverted_from = self._orig_index_file
                     return self.index_file if diverted_from is None else diverted_from
                 @property
                 def is_delaying(self):
                     """Is the revlog currently delaying the visibility of written data?

                     The delaying mechanism can be either in-memory or written on disk
                     in a side-file.
                     """
                     if self._delay_buffer is not None:
                         return True
                     return self._orig_index_file is not None
                 # Derived from index values.
                 def start(self, rev):
                     """Offset of the data chunk for this revision.

                     The offset is the first index field shifted right by 16 bits.
                     """
                     packed_offset = self.index[rev][0]
                     return int(packed_offset >> 16)
                 def length(self, rev):
                     """Length of the data chunk for this revision (second index
                     field)."""
                     entry = self.index[rev]
                     return entry[1]
                 def end(self, rev):
                     """End offset of the data chunk for this revision: its start plus
                     its length."""
                     chunk_start = self.start(rev)
                     chunk_length = self.length(rev)
                     return chunk_start + chunk_length
                 def deltaparent(self, rev):
                     """Return the delta parent of the given revision.

                     A revision that is its own base has ``nullrev`` as delta parent.
                     Otherwise the parent is the stored base with general delta, and
                     the previous revision without it.
                     """
                     base = self.index[rev][3]
                     if base == rev:
                         return nullrev
                     if self.delta_config.general_delta:
                         return base
                     return rev - 1
                 def issnapshot(self, rev):
                     """tells whether rev is a snapshot"""
                     # Without sparse-revlog, only revisions with no delta parent are
                     # snapshots.
                     if not self.delta_config.sparse_revlog:
                         return self.deltaparent(rev) == nullrev
                     elif hasattr(self.index, 'issnapshot'):
                         # directly assign the method to cache the testing and access
                         # (later calls on this instance bypass this function)
                         self.issnapshot = self.index.issnapshot
                         return self.issnapshot(rev)
                     if rev == nullrev:
                         return True
                     entry = self.index[rev]
                     base = entry[3]
                     if base == rev:
                         return True
                     if base == nullrev:
                         return True
                     # Walk from each parent through its delta parents for as long
                     # as the revision has an empty data chunk.
                     p1 = entry[5]
                     while self.length(p1) == 0:
                         b = self.deltaparent(p1)
                         if b == p1:
                             break
                         p1 = b
                     p2 = entry[6]
                     while self.length(p2) == 0:
                         b = self.deltaparent(p2)
                         if b == p2:
                             break
                         p2 = b
                     # A delta against one of the (resolved) parents is not a
                     # snapshot.
                     if base == p1 or base == p2:
                         return False
                     # Otherwise the answer is the one of the delta base.
                     return self.issnapshot(base)
                 def _deltachain(self, rev, stoprev=None):
                     """Compute the delta chain leading to ``rev``.

                     The walk ends early when ``stoprev`` is reached; when it is not
                     given, the walk goes on to the base of the chain.

                     Returns a 2-tuple ``(chain, stopped)``: ``chain`` lists the
                     revisions in ascending order and ``stopped`` tells whether
                     ``stoprev`` was hit.
                     """
                     use_general_delta = self.delta_config.general_delta
                     # Prefer the implementation provided by the index, if any.
                     try:
                         return self.index.deltachain(rev, stoprev, use_general_delta)
                     except AttributeError:
                         pass
                     # Local alias to avoid attribute lookups in the tight loop.
                     entries = self.index
                     revs = []
                     current = rev
                     entry = entries[current]
                     while current != entry[3] and current != stoprev:
                         revs.append(current)
                         current = entry[3] if use_general_delta else current - 1
                         entry = entries[current]
                     stopped = False
                     if current == stoprev:
                         stopped = True
                     else:
                         revs.append(current)
                     revs.reverse()
                     return revs, stopped
                 @util.propertycache
                 def _compressor(self):
                     """Revlog compressor of the configured compression engine, built
                     with the configured engine options."""
                     features = self.feature_config
                     engine = util.compengines[features.compression_engine]
                     return engine.revlogcompressor(features.compression_engine_options)
                 @util.propertycache
                 def _decompressor(self):
                     """The default decompressor.

                     This is None when no default compression header is set.
                     """
                     header = self._default_compression_header
                     if header is None:
                         return None
                     return self._get_decompressor(header).decompress
                 def _get_decompressor(self, t):
                     """Return the compressor object registered for header ``t``.

                     Compressors are cached per header in ``self._decompressors``.
                     On a cache miss the engine is looked up from the header and a
                     compressor is built with the configured engine options.

                     Raises ``error.RevlogError`` when a ``KeyError`` occurs while
                     resolving the engine or building its compressor.
                     """
                     try:
                         compressor = self._decompressors[t]
                     except KeyError:
                         try:
                             engine = util.compengines.forrevlogheader(t)
                             compressor = engine.revlogcompressor(
                                 self.feature_config.compression_engine_options
                             )
                             # remember it for the next chunk with the same header
                             self._decompressors[t] = compressor
                         except KeyError:
                             raise error.RevlogError(
                                 _(b'unknown compression type %s') % binascii.hexlify(t)
                             )
                     return compressor
                 def compress(self, data):
                     """Produce a possibly-compressed representation of ``data``.

                     Returns a ``(header, payload)`` pair.  The header is ``b'u'`` only
                     for data stored uncompressed that does not start with a NUL
                     byte; in every other case it is empty.
                     """
                     if not data:
                         return b'', data
                     packed = self._compressor.compress(data)
                     if packed:
                         # The compressor already put its header in the payload.
                         return b'', packed
                     header = b'' if data[0:1] == b'\0' else b'u'
                     return header, data
                 def decompress(self, data):
                     """Decompress a revlog chunk.

                     The chunk is expected to begin with a header identifying the
                     format type so it can be routed to an appropriate decompressor.

                     Empty data is returned as is.  A failing zlib decompression is
                     reported as ``error.RevlogError``.
                     """
                     if not data:
                         return data
                     # Revlogs are read much more frequently than they are written and many
                     # chunks only take microseconds to decompress, so performance is
                     # important here.
                     #
                     # We can make a few assumptions about revlogs:
                     #
                     # 1) the majority of chunks will be compressed (as opposed to inline
                     #    raw data).
                     # 2) decompressing *any* data will likely be at least 10x slower than
                     #    returning raw inline data.
                     # 3) we want to prioritize common and officially supported compression
                     #    engines
                     #
                     # It follows that we want to optimize for "decompress compressed data
                     # when encoded with common and officially supported compression engines"
                     # case over "raw data" and "data encoded by less common or non-official
                     # compression engines." That is why we have the inline lookup first
                     # followed by the compengines lookup.
                     #
                     # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
                     # compressed chunks. And this matters for changelog and manifest reads.
                     t = data[0:1]
                     if t == b'x':
                         try:
                             return _zlibdecompress(data)
                         except zlib.error as e:
                             raise error.RevlogError(
                                 _(b'revlog decompress error: %s')
                                 % stringutil.forcebytestr(e)
                             )
                     # '\0' is more common than 'u' so it goes first.
                     elif t == b'\0':
                         return data
                     elif t == b'u':
                         # presumably a view of the data without its 1-byte header;
                         # confirm against util.buffer
                         return util.buffer(data, 1)
                     # Any other header is routed to the matching compression engine.
                     compressor = self._get_decompressor(t)
                     return compressor.decompress(data)
                 @contextlib.contextmanager
                 def reading(self):
                     """Keep the data and sidedata files open for the duration of the block.

                     An empty index means there is nothing to read, so no file is
                     opened. Combining an inline revlog with a delay buffer is rejected
                     with a ProgrammingError.
                     """
                     if len(self.index) == 0:
                         # nothing to be read
                         yield
                         return
                     if self.inline and self._delay_buffer is not None:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)
                     # the sidedata segment is entered second and therefore released first
                     with self._segmentfile.reading(), self._segmentfile_sidedata.reading():
                         yield
                 @property
                 def is_writing(self):
                     """True if a writing context is currently open"""
                     handles = self._writinghandles
                     return handles is not None
                 @property
                 def is_open(self):
                     """Tell whether any file handle is currently being held.

                     Used for assertions and debugging in the Python code.
                     """
                     data_open = self._segmentfile.is_open
                     if data_open:
                         return data_open
                     return self._segmentfile_sidedata.is_open
                 @contextlib.contextmanager
                 def writing(self, transaction, data_end=None, sidedata_end=None):
                     """Open the revlog files for writing.

                     Adding content to a revlog should be done within such a context.

                     If a writing context is already open, this is a no-op that simply
                     yields. Otherwise the data file (for non-inline revlogs), the
                     sidedata file (when one is configured) and the index file are
                     opened, registered with ``transaction`` through
                     ``transaction.add(filename, offset)`` and exposed as writing
                     handles until the context exits, at which point they are closed.

                     ``data_end`` is the position to seek to in the data file; when it
                     is None the handle is positioned at the end of the file.
                     ``sidedata_end`` is the position to seek to in the sidedata file and
                     must be provided whenever a sidedata file is configured.
                     """
                     if self.is_writing:
                         yield
                     else:
                         ifh = dfh = sdfh = None
                         try:
                             r = len(self.index)
                             # opening the data file.
                             dsize = 0
                             if r:
                                 dsize = self.end(r - 1)
                             if not self.inline:
                                 try:
                                     dfh = self.opener(self.data_file, mode=b"r+")
                                     if data_end is None:
                                         dfh.seek(0, os.SEEK_END)
                                     else:
                                         dfh.seek(data_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     dfh = self.opener(self.data_file, mode=b"w+")
                                 transaction.add(self.data_file, dsize)
                             if self.sidedata_file is not None:
                                 assert sidedata_end is not None
                                 # revlog-v2 does not inline, help Pytype
                                 assert dfh is not None
                                 try:
                                     sdfh = self.opener(self.sidedata_file, mode=b"r+")
                                     # position the sidedata handle itself (the data
                                     # handle was already positioned above)
                                     sdfh.seek(sidedata_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     sdfh = self.opener(self.sidedata_file, mode=b"w+")
                                 transaction.add(self.sidedata_file, sidedata_end)
                             # opening the index file.
                             isize = r * self.index.entry_size
                             ifh = self.__index_write_fp()
                             if self.inline:
                                 # inline revlogs keep the data inside the index file
                                 transaction.add(self.index_file, dsize + isize)
                             else:
                                 transaction.add(self.index_file, isize)
                             # exposing all file handle for writing.
                             self._writinghandles = (ifh, dfh, sdfh)
                             self._segmentfile.writing_handle = ifh if self.inline else dfh
                             self._segmentfile_sidedata.writing_handle = sdfh
                             yield
                         finally:
                             self._writinghandles = None
                             self._segmentfile.writing_handle = None
                             self._segmentfile_sidedata.writing_handle = None
                             if dfh is not None:
                                 dfh.close()
                             if sdfh is not None:
                                 sdfh.close()
                             # closing the index file last to avoid exposing referent to
                             # potential unflushed data content.
                             if ifh is not None:
                                 ifh.close()
                 def __index_write_fp(self, index_end=None):
                     """Internal helper opening the index file for writing.

                     You should not use this directly; use the ``writing`` context
                     instead.

                     The file is first opened in ``r+`` mode and positioned at
                     ``index_end`` (or at the end of the file when ``index_end`` is
                     None). If that raises FileNotFoundError, the file is opened in
                     ``w+`` mode instead and returned without any seek.
                     """

                     def open_index(mode):
                         if self._delay_buffer is None:
                             return self.opener(
                                 self.index_file,
                                 mode=mode,
                                 checkambig=self.data_config.check_ambig,
                             )
                         # check_ambig affects the way a file is opened for writing.
                         # Here no file is actually opened for writing, as writes are
                         # appended to the delay buffer, so check_ambig is neither
                         # meaningful nor needed.
                         return randomaccessfile.appender(
                             self.opener, self.index_file, mode, self._delay_buffer
                         )

                     try:
                         fp = open_index(b"r+")
                         if index_end is not None:
                             fp.seek(index_end, os.SEEK_SET)
                         else:
                             fp.seek(0, os.SEEK_END)
                         return fp
                     except FileNotFoundError:
                         return open_index(b"w+")
                 def __index_new_fp(self):
                     """Internal helper creating a brand new index file for writing.

                     You should not use this unless you are upgrading from an inline
                     revlog. The file is opened in ``w`` mode with ``atomictemp=True``.
                     """
                     check_ambig = self.data_config.check_ambig
                     new_index = self.opener(
                         self.index_file,
                         mode=b"w",
                         checkambig=check_ambig,
                         atomictemp=True,
                     )
                     return new_index
                 def split_inline(self, tr, header, new_index_file_path=None):
                     """Split the data of an inline revlog into an index and a data file.

                     ``header`` is packed in front of the first index entry of the new
                     index. When ``new_index_file_path`` is given, the new index is
                     written to that path, which becomes ``self.index_file``. ``tr`` is
                     accepted but not used by this method.

                     If writing handles were open on entry, the index handle is closed
                     first and a new set of handles (index + new data file) is installed
                     before returning.

                     Returns the index file name in use after the split.
                     """
                     assert self._delay_buffer is None
                     had_handles = self._writinghandles is not None
                     if had_handles:
                         old_ifh = self._writinghandles[0]
                         old_ifh.flush()
                         old_ifh.close()
                         # The cached file handle is unusable once closed, so make
                         # sure nobody picks it up again.
                         self._writinghandles = None
                         self._segmentfile.writing_handle = None
                         # The sidedata writing handle needs no care: it only exists
                         # with revlog-v2, which is never inline and so never gets
                         # here.
                     data_fp = self.opener(self.data_file, mode=b"w+")
                     data_fp.truncate(0)  # drop any potentially existing data
                     try:
                         # copy every revision segment out of the inline file
                         with self.reading():
                             for rev in range(len(self.index)):
                                 segment = self.get_segment_for_revs(rev, rev)[1]
                                 data_fp.write(segment)
                             data_fp.flush()
                         if new_index_file_path is not None:
                             self.index_file = new_index_file_path
                         with self.__index_new_fp() as index_fp:
                             self.inline = False
                             for rev in range(len(self.index)):
                                 binary = self.index.entry_binary(rev)
                                 if rev == 0:
                                     # the first entry carries the index header
                                     binary = self.index.pack_header(header) + binary
                                 index_fp.write(binary)
                             # If we don't use side-write, the temp file replaces the
                             # real index when the context manager exits
                         self._segmentfile = randomaccessfile.randomaccessfile(
                             self.opener,
                             self.data_file,
                             self.data_config.chunk_cache_size,
                         )
                         if had_handles:
                             # switched from inline to conventional: reopen the index
                             ifh = self.__index_write_fp()
                             self._writinghandles = (ifh, data_fp, None)
                             self._segmentfile.writing_handle = data_fp
                             # ownership moved to the writing handles, do not close
                             data_fp = None
                     finally:
                         if data_fp is not None:
                             data_fp.close()
                     return self.index_file
                 def get_segment_for_revs(self, startrev, endrev):
                     """Obtain the raw data segment covering a range of revisions.

                     Accepts the start and end revisions (both included). The data is
                     read through ``self._segmentfile.read_chunk``.

                     Returns a 2-tuple of (offset, data) for the requested range of
                     revisions. Offset is the integer offset from the beginning of the
                     revlog and data is the raw data returned by the segment file.

                     Callers will need to call ``self.start(rev)`` and
                     ``self.length(rev)`` to determine where each revision's data begins
                     and ends.

                     API: we should consider making this a private part of the
                     InnerRevlog at some point.
                     """
                     # self.start(startrev) and self.end(endrev) are inlined here for
                     # performance reasons (function calls are expensive).
                     index = self.index
                     first = index[startrev]
                     last = first if startrev == endrev else index[endrev]
                     # the data offset lives above the low 16 bits of the first field
                     start = int(first[0] >> 16)
                     end = int(last[0] >> 16) + last[1]
                     if self.inline:
                         # inline data is interleaved with the index entries
                         entry_size = self.index.entry_size
                         start += (startrev + 1) * entry_size
                         end += (endrev + 1) * entry_size
                     return start, self._segmentfile.read_chunk(start, end - start)
                 def _chunk(self, rev):
                     """Obtain a single decompressed chunk for a revision.
                     Accepts an integer revision and an optional already-open file handle
                     to be used for reading. If used, the seek position of the file will not
                     be preserved.
                     Returns a str holding uncompressed data for the requested revision.
                     """
                     if self._uncompressed_chunk_cache is not None:
                         uncomp = self._uncompressed_chunk_cache.get(rev)
                         if uncomp is not None:
                             return uncomp
                     compression_mode = self.index[rev][10]
                     data = self.get_segment_for_revs(rev, rev)[1]
                     if compression_mode == COMP_MODE_PLAIN:
                         uncomp = data
                     elif compression_mode == COMP_MODE_DEFAULT:
                         uncomp = self._decompressor(data)
                     elif compression_mode == COMP_MODE_INLINE:
                         uncomp = self.decompress(data)
                     else:
                         msg = b'unknown compression mode %d'
                         msg %= compression_mode
                         raise error.RevlogError(msg)
                     if self._uncompressed_chunk_cache is not None:
                         self._uncompressed_chunk_cache.insert(rev, uncomp, cost=len(uncomp))
                     return uncomp
                 def _chunks(self, revs, targetsize=None):
                     """Obtain decompressed chunks for the specified revisions.
                     Accepts an iterable of numeric revisions that are assumed to be in
                     ascending order. Also accepts an optional already-open file handle
                     to be used for reading. If used, the seek position of the file will
                     not be preserved.
                     This function is similar to calling ``self._chunk()`` multiple times,
                     but is faster.
                     Returns a list with decompressed data for each requested revision.
                     """
                     if not revs:
                         return []
                     start = self.start
                     length = self.length
                     inline = self.inline
                     iosize = self.index.entry_size
                     buffer = util.buffer
                     fetched_revs = []
                     fadd = fetched_revs.append
                     chunks = []
                     ladd = chunks.append
                     if self._uncompressed_chunk_cache is None:
                         fetched_revs = revs
                     else:
                         for rev in revs:
                             cached_value = self._uncompressed_chunk_cache.get(rev)
                             if cached_value is None:
                                 fadd(rev)
                             else:
                                 ladd((rev, cached_value))
                     if not fetched_revs:
                         slicedchunks = ()
                     elif not self.data_config.with_sparse_read:
                         slicedchunks = (fetched_revs,)
                     else:
                         slicedchunks = deltautil.slicechunk(
                             self,
                             fetched_revs,
                             targetsize=targetsize,
                         )
                     for revschunk in slicedchunks:
                         firstrev = revschunk[0]
                         # Skip trailing revisions with empty diff
                         for lastrev in revschunk[::-1]:
                             if length(lastrev) != 0:
                                 break
                         try:
                             offset, data = self.get_segment_for_revs(firstrev, lastrev)
                         except OverflowError:
                             # issue4215 - we can't cache a run of chunks greater than
                             # 2G on Windows
                             for rev in revschunk:
                                 ladd((rev, self._chunk(rev)))
                         decomp = self.decompress
                         # self._decompressor might be None, but will not be used in that case
                         def_decomp = self._decompressor
                         for rev in revschunk:
                             chunkstart = start(rev)
                             if inline:
                                 chunkstart += (rev + 1) * iosize
                             chunklength = length(rev)
                             comp_mode = self.index[rev][10]
                             c = buffer(data, chunkstart - offset, chunklength)
                             if comp_mode == COMP_MODE_PLAIN:
                                 c = c
                             elif comp_mode == COMP_MODE_INLINE:
                                 c = decomp(c)
                             elif comp_mode == COMP_MODE_DEFAULT:
                                 c = def_decomp(c)
                             else:
                                 msg = b'unknown compression mode %d'
                                 msg %= comp_mode
                                 raise error.RevlogError(msg)
                             ladd((rev, c))
                             if self._uncompressed_chunk_cache is not None:
                                 self._uncompressed_chunk_cache.insert(rev, c, len(c))
                     chunks.sort()
                     return [x[1] for x in chunks]
                 def raw_text(self, node, rev):
                     """Return the possibly unvalidated rawtext for a revision.

                     Returns (rev, rawtext, validated); ``validated`` is always False
                     here. ``node`` is accepted but not used by this method.

                     The revision cache is dropped as a side effect; the caller is
                     expected to refill it after validating the text.
                     """
                     # The cache entry looks like (node, rev, rawtext); the cached
                     # revision may be usable as a base to apply deltas on.
                     cache_entry = self._revisioncache
                     stop_at = cache_entry[1] if cache_entry else None
                     chain, stopped = self._deltachain(rev, stoprev=stop_at)
                     # intermediate text the deltas get applied to
                     base = self._revisioncache[2] if stopped else None
                     # drop cache to save memory, the caller is expected to
                     # update self._inner._revisioncache after validating the text
                     self._revisioncache = None
                     rawsize = self.index[rev][2]
                     targetsize = 4 * rawsize if 0 <= rawsize else None
                     chunk_cache = self._uncompressed_chunk_cache
                     if chunk_cache is not None:
                         # grow the uncompressed chunk cache along with the largest
                         # revision seen in this revlog
                         wanted = rawsize * self.data_config.uncompressed_cache_factor
                         if wanted > chunk_cache.maxcost:
                             chunk_cache.maxcost = wanted
                     deltas = self._chunks(chain, targetsize=targetsize)
                     if base is None:
                         # nothing usable in cache: the first chunk is the base text
                         base = bytes(deltas[0])
                         deltas = deltas[1:]
                     rawtext = mdiff.patches(base, deltas)
                     del base  # let us have a chance to free memory early
                     return (rev, rawtext, False)
                 def sidedata(self, rev, sidedata_end):
                     """Return the sidedata for a given revision number.

                     An empty dict is returned when the index records no sidedata for
                     ``rev``. RevlogError is raised when the recorded segment extends
                     past ``sidedata_end`` or uses an unknown compression mode.
                     """
                     entry = self.index[rev]
                     offset, size = entry[8], entry[9]
                     if self.inline:
                         offset += self.index.entry_size * (1 + rev)
                     if size == 0:
                         return {}
                     if offset + size > sidedata_end:
                         m = FILE_TOO_SHORT_MSG % (
                             self.sidedata_file,
                             size,
                             offset,
                             sidedata_end,
                         )
                         raise error.RevlogError(m)
                     raw = self._segmentfile_sidedata.read_chunk(offset, size)
                     mode = self.index[rev][11]
                     if mode == COMP_MODE_PLAIN:
                         # stored as is
                         segment = raw
                     elif mode == COMP_MODE_DEFAULT:
                         segment = self._decompressor(raw)
                     elif mode == COMP_MODE_INLINE:
                         segment = self.decompress(raw)
                     else:
                         raise error.RevlogError(b'unknown compression mode %d' % mode)
                     return sidedatautil.deserialize_sidedata(segment)
                 def write_entry(
                     self,
                     transaction,
                     entry,
                     data,
                     link,
                     offset,
                     sidedata,
                     sidedata_offset,
                     index_end,
                     data_end,
                     sidedata_end,
                 ):
                     """Write one index entry and its data through the writing handles.

                     ``entry`` is the binary index entry and ``data`` a pair whose two
                     items are written one after the other. For a non-inline revlog the
                     data goes to the data file, ``sidedata`` (if any) to the sidedata
                     file and the entry to the index file, or to the delay buffer when
                     one is set. For an inline revlog everything goes to the index
                     file. ``link`` is accepted but not used by this method.

                     Must be called with writing handles open, otherwise
                     ProgrammingError is raised.

                     Returns the positions, after the write, of the index, data and
                     sidedata handles (None for a handle that is not set).
                     """
                     handles = self._writinghandles
                     if handles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     ifh, dfh, sdfh = handles
                     # Always reposition every handle before writing.
                     #
                     # Files opened in a+ mode behave inconsistently across platforms.
                     # Windows requires a file positioning call when a handle switches
                     # between reads and writes (see 3686fa2b8eee and the
                     # mixedfilemodewrapper in windows.py). Elsewhere, Python or the
                     # platform itself can be buggy: some versions of Solaris have been
                     # observed not to append at the end of the file if it was seeked
                     # to before the end (see issue4943).
                     #
                     # Note: this is likely unnecessary on Python 3. However the
                     # handles are reused for reads and may be seeked there, so be
                     # careful before changing this.
                     if index_end is not None:
                         ifh.seek(index_end, os.SEEK_SET)
                     else:
                         ifh.seek(0, os.SEEK_END)
                     if dfh:
                         if data_end is not None:
                             dfh.seek(data_end, os.SEEK_SET)
                         else:
                             dfh.seek(0, os.SEEK_END)
                     if sdfh:
                         sdfh.seek(sidedata_end, os.SEEK_SET)
                     curr = len(self.index) - 1
                     if self.inline:
                         if self._delay_buffer is not None:
                             msg = b'invalid delayed write on inline revlog'
                             raise error.ProgrammingError(msg)
                         # inline data is interleaved with the index entries
                         offset += curr * self.index.entry_size
                         transaction.add(self.canonical_index_file, offset)
                         assert not sidedata
                         for piece in (entry, data[0], data[1]):
                             ifh.write(piece)
                     else:
                         transaction.add(self.data_file, offset)
                         if self.sidedata_file:
                             transaction.add(self.sidedata_file, sidedata_offset)
                         transaction.add(self.canonical_index_file, curr * len(entry))
                         header, payload = data[0], data[1]
                         if header:
                             dfh.write(header)
                         dfh.write(payload)
                         if sidedata:
                             sdfh.write(sidedata)
                         if self._delay_buffer is not None:
                             self._delay_buffer.append(entry)
                         else:
                             ifh.write(entry)
                     index_pos = ifh.tell()
                     data_pos = dfh.tell() if dfh else None
                     sidedata_pos = sdfh.tell() if sdfh else None
                     return (index_pos, data_pos, sidedata_pos)
                 def _divert_index(self):
                     return self.index_file + b'.a'
                 def delay(self):
                     """Start delaying (or diverting) writes to the index file.

                     Nothing happens if a delay or a divert is already in place. With an
                     empty index, writes are diverted: ``index_file`` is switched to the
                     diverted name (any existing file of that name is removed) and that
                     name is returned. Otherwise an in-memory delay buffer is set up and
                     None is returned.

                     Must not be called while files are open, nor on an inline revlog
                     (ProgrammingError).
                     """
                     assert not self.is_open
                     if self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)
                     already_set = (
                         self._delay_buffer is not None
                         or self._orig_index_file is not None
                     )
                     if already_set:
                         # delay or divert already in place
                         return None
                     if len(self.index) != 0:
                         # existing content: buffer the new entries in memory
                         self._delay_buffer = []
                         return None
                     # empty revlog: write to a side file instead
                     self._orig_index_file = self.index_file
                     self.index_file = self._divert_index()
                     assert self._orig_index_file is not None
                     assert self.index_file is not None
                     if self.opener.exists(self.index_file):
                         self.opener.unlink(self.index_file)
                     return self.index_file
                 def write_pending(self):
                     """Write the delayed index content to a side "pending" index file.

                     Returns a ``(index_file, any_pending)`` pair. When writes are
                     already diverted, ``(None, True)`` is returned right away.
                     Otherwise the index file is copied to the diverted name, the
                     buffered entries (if any) are appended to the copy, the delay
                     buffer is dropped and ``index_file`` is switched to the copy.

                     Must not be called while files are open, nor on an inline revlog
                     (ProgrammingError).
                     """
                     assert not self.is_open
                     if self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)
                     if self._orig_index_file is not None:
                         return None, True
                     opener = self.opener
                     pending = self._divert_index()
                     # start from a fresh copy of the current index
                     if opener.exists(pending):
                         opener.unlink(pending)
                     util.copyfile(
                         opener.join(self.index_file),
                         opener.join(pending),
                     )
                     wrote = False
                     if self._delay_buffer:
                         with opener(pending, b'r+') as ifh:
                             ifh.seek(0, os.SEEK_END)
                             ifh.write(b"".join(self._delay_buffer))
                         wrote = True
                     self._delay_buffer = None
                     self._orig_index_file = self.index_file
                     self.index_file = pending
                     return self.index_file, wrote
                 def finalize_pending(self):
                     """Make the delayed or diverted index content final.

                     With a delay buffer, the buffered entries are appended to the index
                     file and the buffer is dropped. With a diverted index, the diverted
                     file (if it exists) is renamed over the original one and
                     ``index_file`` is restored. ProgrammingError is raised when neither
                     is in place, or when the revlog is inline.

                     Returns ``self.canonical_index_file``.
                     """
                     assert not self.is_open
                     if self.inline:
                         msg = "revlog with delayed write should not be inline"
                         raise error.ProgrammingError(msg)
                     buffered = self._delay_buffer
                     original = self._orig_index_file
                     if buffered is not None and original is not None:
                         assert False, "unreachable"
                     elif buffered is not None:
                         if buffered:
                             with self.opener(self.index_file, b'r+') as ifh:
                                 ifh.seek(0, os.SEEK_END)
                                 ifh.write(b"".join(buffered))
                         self._delay_buffer = None
                     elif original is not None:
                         if self.opener.exists(self.index_file):
                             self.opener.rename(
                                 self.index_file,
                                 original,
                                 checkambig=True,
                             )
                         self.index_file = original
                         self._orig_index_file = None
                     else:
                         msg = b"not delay or divert found on this revlog"
                         raise error.ProgrammingError(msg)
                     return self.canonical_index_file
             class revlog:
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, including its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 If checkambig, indexfile is opened with checkambig=True at
                 writing, to avoid file stat ambiguity.
                 If mmaplargeindex is True, and an mmapindexthreshold is set, the
                 index will be mmapped rather than read if it is larger than the
                 configured threshold.
                 If censorable is True, the revlog can have censored revisions.
                 If `upperboundcomp` is not None, this is the expected maximal gain from
                 compression for the data content.
                 `concurrencychecker` is an optional function that receives 3 arguments: a
                 file handle, a filename, and an expected position. It should check whether
                 the current position in the file handle is valid, and log/warn/fail (by
                 raising).
                 See mercurial/revlogutils/constants.py for details about the content of an
                 index entry.
                 """
                 _flagserrorclass = error.RevlogError
                 @staticmethod
                 def is_inline_index(header_bytes):
                     """Determine if a revlog is inline from the initial bytes of the index.

                     Empty header bytes are reported as inline. Otherwise the header is
                     unpacked, split into a format version (low 16 bits) and format flags
                     (remaining bits), and the ``inline`` feature check registered for
                     that version is applied to the flags.
                     """
                     if not len(header_bytes):
                         return True
                     header = INDEX_HEADER.unpack(header_bytes)[0]
                     version = header & 0xFFFF
                     flags = header & ~0xFFFF
                     inline_check = FEATURES_BY_VERSION[version][b'inline']
                     return inline_check(flags)
                 def __init__(
                     self,
                     opener,
                     target,
                     radix,
                     postfix=None,  # only exist for `tmpcensored` now
                     checkambig=False,
                     mmaplargeindex=False,
                     censorable=False,
                     upperboundcomp=None,
                     persistentnodemap=False,
                     concurrencychecker=None,
                     trypending=False,
                     try_split=False,
                     canonical_parent_order=True,
                     data_config=None,
                     delta_config=None,
                     feature_config=None,
                     may_inline=True,  # may inline new revlog
                 ):
                     """Create a revlog object.

                     ``opener`` is a function that abstracts the file opening operation
                     and can be used to implement COW semantics or the like.

                     ``target`` is a ``(KIND, ID)`` tuple identifying the content stored
                     in this revlog, so the rest of the code does not have to resort to
                     heuristics or index filename analysis. Normal code must set it
                     reliably; test, debug, or performance measurement code might not
                     set it to an accurate value.

                     For each of ``feature_config``, ``data_config`` and ``delta_config``:
                     an explicitly passed object is copied; otherwise the matching entry
                     of ``opener.options`` is copied; otherwise a default instance is
                     created. The index is loaded before the constructor returns.
                     """
                     self.radix = radix
                     # File names start unset; _loadindex() fills them in.
                     self._docket_file = self._indexfile = None
                     self._datafile = self._sidedatafile = None
                     self._nodemap_file = None
                     self.postfix = postfix
                     self._trypending = trypending
                     self._try_split = try_split
                     self._may_inline = may_inline
                     self.opener = opener
                     if persistentnodemap:
                         self._nodemap_file = nodemaputil.get_nodemap_file(self)

                     assert target[0] in ALL_KINDS
                     assert len(target) == 2
                     self.target = target

                     # Feature configuration.
                     if feature_config is None:
                         options = self.opener.options
                         if b'feature-config' in options:
                             feature_config = options[b'feature-config'].copy()
                         else:
                             feature_config = FeatureConfig()
                     else:
                         feature_config = feature_config.copy()
                     self.feature_config = feature_config
                     self.feature_config.censorable = censorable
                     self.feature_config.canonical_parent_order = canonical_parent_order

                     # Data configuration.
                     if data_config is None:
                         options = self.opener.options
                         if b'data-config' in options:
                             data_config = options[b'data-config'].copy()
                         else:
                             data_config = DataConfig()
                     else:
                         data_config = data_config.copy()
                     self.data_config = data_config
                     self.data_config.check_ambig = checkambig
                     self.data_config.mmap_large_index = mmaplargeindex

                     # Delta configuration.
                     if delta_config is None:
                         options = self.opener.options
                         if b'delta-config' in options:
                             delta_config = options[b'delta-config'].copy()
                         else:
                             delta_config = DeltaConfig()
                     else:
                         delta_config = delta_config.copy()
                     self.delta_config = delta_config
                     self.delta_config.upper_bound_comp = upperboundcomp

                     # Maps rev to chain base rev.
                     self._chainbasecache = util.lrucachedict(100)

                     self.index = None
                     self._docket = None
                     self._nodemap_docket = None
                     # Mapping of partial identifiers to full nodes.
                     self._pcache = {}

                     # Other optional features.
                     # Each instance gets its own copy of the flag processors so it can
                     # support custom flags.
                     self._flagprocessors = dict(flagutil.flagprocessors)
                     # prevent nesting of addgroup
                     self._adding_group = None

                     loaded_chunk_cache = self._loadindex()
                     self._load_inner(loaded_chunk_cache)
                     self._concurrencychecker = concurrencychecker
                 def _init_opts(self):
                     """Turn opener options and configs into the default revlog mode.

                     These values might still be overridden by what is actually found on
                     disk. The relevant values are returned for use in _loadindex().

                     Returns a ``(new_header, mmap_index_threshold, force_nodemap)`` tuple:

                     * new_header:
                         version header to use if we need to create a new revlog
                     * mmap_index_threshold:
                         minimal index size to start using mmap (``None`` when mmap of
                         large indexes is not enabled)
                     * force_nodemap:
                         force the usage of a "development" version of the nodemap code

                     Raises ``error.RevlogError`` when the configured chunk cache size is
                     not a strictly positive power of two.
                     """
                     options = self.opener.options
                     if b'changelogv2' in options and self.revlog_kind == KIND_CHANGELOG:
                         header = CHANGELOGV2
                         self.feature_config.compute_rank = options.get(
                             b'changelogv2.compute-rank', True
                         )
                     elif b'revlogv2' in options:
                         header = REVLOGV2
                     elif b'revlogv1' in options:
                         header = REVLOGV1
                         if self._may_inline:
                             header |= FLAG_INLINE_DATA
                         if b'generaldelta' in options:
                             header |= FLAG_GENERALDELTA
                     elif b'revlogv0' in options:
                         header = REVLOGV0
                     else:
                         header = REVLOG_DEFAULT_VERSION

                     data_config = self.data_config
                     mmap_threshold = (
                         data_config.mmap_index_threshold
                         if data_config.mmap_large_index
                         else None
                     )

                     if self.feature_config.enable_ellipsis:
                         self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

                     # revlog v0 doesn't have flag processors
                     extra_processors = options.get(b'flagprocessors', {})
                     for flag, processor in extra_processors.items():
                         flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

                     cache_size = data_config.chunk_cache_size
                     if cache_size <= 0:
                         raise error.RevlogError(
                             _(b'revlog chunk cache size %r is not greater than 0')
                             % cache_size
                         )
                     # A power of two has a single bit set, so clearing its lowest set
                     # bit must leave zero.
                     if cache_size & (cache_size - 1):
                         raise error.RevlogError(
                             _(b'revlog chunk cache size %r is not a power of 2')
                             % cache_size
                         )

                     nodemap_forced = options.get(b'devel-force-nodemap', False)
                     return header, mmap_threshold, nodemap_forced
                 def _get_data(self, filepath, mmap_threshold, size=None):
                     """return a file content with or without mmap
                     If the file is missing return the empty string"""
                     try:
                         with self.opener(filepath) as fp:
                             if mmap_threshold is not None:
                                 file_size = self.opener.fstat(fp).st_size
                                 if file_size >= mmap_threshold:
                                     if size is not None:
                                         # avoid potentiel mmap crash
                                         size = min(file_size, size)
                                     # TODO: should .close() to release resources without
                                     # relying on Python GC
                                     if size is None:
                                         return util.buffer(util.mmapread(fp))
                                     else:
                                         return util.buffer(util.mmapread(fp, size))
                             if size is None:
                                 return fp.read()
                             else:
                                 return fp.read(size)
                     except FileNotFoundError:
                         return b''
                 def get_streams(self, max_linkrev, force_inline=False):
                     """Return a list of streams that represent this revlog.

                     This is used by stream-clone to do bytes to bytes copies of a
                     repository.

                     Trailing revisions whose linkrev is not below `max_linkrev` are
                     dropped; the streams cover every revision before them.

                     If `force_inline` is set, it enforces that the stream will represent
                     an inline revlog.

                     It returns a list of three-tuples (empty when there is nothing to
                     send):

                         [
                             (filename, bytes_stream, stream_size),
                             …
                         ]

                     Each ``bytes_stream`` is a generator that has already been advanced
                     past its first ``yield``, so the underlying file (or reading context)
                     is open by the time this method returns.
                     """
                     n = len(self)
                     index = self.index
                     # Walk back from the tip to find how many revisions to stream.
                     while n > 0:
                         # entry field 4 is the linkrev (see linkrev())
                         linkrev = index[n - 1][4]
                         if linkrev < max_linkrev:
                             break
                         # note: this loop will rarely go through multiple iterations, since
                         # it only traverses commits created during the current streaming
                         # pull operation.
                         #
                         # If this become a problem, using a binary search should cap the
                         # runtime of this.
                         n = n - 1
                     if n == 0:
                         # no data to send
                         return []
                     index_size = n * index.entry_size
                     # end offset of the last streamed revision's data
                     data_size = self.end(n - 1)
                     # XXX we might have been split (or stripped) since the object
                     # initialization, We need to close this race too, but having a way to
                     # pre-open the file we feed to the revlog and never closing them before
                     # we are done streaming.
                     if self._inline:
                         # Already inline: a single file holds index and data, stream its
                         # first `index_size + data_size` bytes.
                         def get_stream():
                             with self.opener(self._indexfile, mode=b"r") as fp:
                                 # priming yield: lets the caller open the file eagerly
                                 yield None
                                 size = index_size + data_size
                                 if size <= 65536:
                                     yield fp.read(size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=size)
                         inline_stream = get_stream()
                         # run up to the priming yield so the file is opened now
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     elif force_inline:
                         # Not inline on disk but an inline stream is requested: emit each
                         # index entry followed by that revision's data segment.
                         def get_stream():
                             with self.reading():
                                 # priming yield: enters the reading context eagerly
                                 yield None
                                 for rev in range(n):
                                     idx = self.index.entry_binary(rev)
                                     if rev == 0 and self._docket is None:
                                         # re-inject the inline flag
                                         header = self._format_flags
                                         header |= self._format_version
                                         header |= FLAG_INLINE_DATA
                                         header = self.index.pack_header(header)
                                         idx = header + idx
                                     yield idx
                                     yield self._inner.get_segment_for_revs(rev, rev)[1]
                         inline_stream = get_stream()
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     else:
                         # Separate index and data files: one stream per file.
                         def get_index_stream():
                             with self.opener(self._indexfile, mode=b"r") as fp:
                                 yield None
                                 if index_size <= 65536:
                                     yield fp.read(index_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=index_size)
                         def get_data_stream():
                             with self._datafp() as fp:
                                 yield None
                                 if data_size <= 65536:
                                     yield fp.read(data_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=data_size)
                         index_stream = get_index_stream()
                         next(index_stream)
                         data_stream = get_data_stream()
                         next(data_stream)
                         # the data file is listed before the index file
                         return [
                             (self._datafile, data_stream, data_size),
                             (self._indexfile, index_stream, index_size),
                         ]
                 def _loadindex(self, docket=None):
                     """Locate, read and parse the index; return the parser's chunk cache.

                     The method picks the entry-point file, decodes the format header (or
                     falls back to the default from ``_init_opts()`` when the file is
                     empty or missing), resolves the index/data/sidedata file names,
                     selects an index parser and stores the parsed index on
                     ``self.index``.

                     If ``docket`` is given it is used as-is and the entry point is not
                     read.

                     Raises ``error.RevlogError`` for an unknown format version, unknown
                     format flags, a docket-managed index shorter than the docket
                     announces, or when parsing raises ``ValueError``/``IndexError``.
                     """
                     new_header, mmapindexthreshold, force_nodemap = self._init_opts()
                     # Select the entry point: explicit postfix first, then a pending
                     # file, then a split index file, then the regular `<radix>.i`.
                     if self.postfix is not None:
                         entry_point = b'%s.i.%s' % (self.radix, self.postfix)
                     elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
                         entry_point = b'%s.i.a' % self.radix
                     elif self._try_split and self.opener.exists(self._split_index_file):
                         entry_point = self._split_index_file
                     else:
                         entry_point = b'%s.i' % self.radix
                     if docket is not None:
                         self._docket = docket
                         self._docket_file = entry_point
                     else:
                         self._initempty = True
                         entry_data = self._get_data(entry_point, mmapindexthreshold)
                         if len(entry_data) > 0:
                             # the first 4 bytes carry the flags and the version
                             header = INDEX_HEADER.unpack(entry_data[:4])[0]
                             self._initempty = False
                         else:
                             header = new_header
                         # high bits: format flags, low 16 bits: format version
                         self._format_flags = header & ~0xFFFF
                         self._format_version = header & 0xFFFF
                         supported_flags = SUPPORTED_FLAGS.get(self._format_version)
                         if supported_flags is None:
                             msg = _(b'unknown version (%d) in revlog %s')
                             msg %= (self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         elif self._format_flags & ~supported_flags:
                             msg = _(b'unknown flags (%#04x) in version %d revlog %s')
                             display_flag = self._format_flags >> 16
                             msg %= (display_flag, self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         features = FEATURES_BY_VERSION[self._format_version]
                         self._inline = features[b'inline'](self._format_flags)
                         self.delta_config.general_delta = features[b'generaldelta'](
                             self._format_flags
                         )
                         self.feature_config.has_side_data = features[b'sidedata']
                         if not features[b'docket']:
                             # no docket: the entry point is the index itself
                             self._indexfile = entry_point
                             index_data = entry_data
                         else:
                             # the entry point is a docket describing the other files
                             self._docket_file = entry_point
                             if self._initempty:
                                 self._docket = docketutil.default_docket(self, header)
                             else:
                                 self._docket = docketutil.parse_docket(
                                     self, entry_data, use_pending=self._trypending
                                 )
                     if self._docket is not None:
                         self._indexfile = self._docket.index_filepath()
                         index_data = b''
                         index_size = self._docket.index_end
                         if index_size > 0:
                             # read only the part of the index the docket vouches for
                             index_data = self._get_data(
                                 self._indexfile, mmapindexthreshold, size=index_size
                             )
                             if len(index_data) < index_size:
                                 msg = _(b'too few index data for %s: got %d, expected %d')
                                 msg %= (self.display_id, len(index_data), index_size)
                                 raise error.RevlogError(msg)
                         self._inline = False
                         # generaldelta implied by version 2 revlogs.
                         self.delta_config.general_delta = True
                         # the logic for persistent nodemap will be dealt with within the
                         # main docket, so disable it for now.
                         self._nodemap_file = None
                     # Resolve the data (and sidedata) file names.
                     if self._docket is not None:
                         self._datafile = self._docket.data_filepath()
                         self._sidedatafile = self._docket.sidedata_filepath()
                     elif self.postfix is None:
                         self._datafile = b'%s.d' % self.radix
                     else:
                         self._datafile = b'%s.d.%s' % (self.radix, self.postfix)
                     self.nodeconstants = sha1nodeconstants
                     self.nullid = self.nodeconstants.nullid
                     # sparse-revlog can't be on without general-delta (issue6056)
                     if not self.delta_config.general_delta:
                         self.delta_config.sparse_revlog = False
                     self._storedeltachains = True
                     devel_nodemap = (
                         self._nodemap_file
                         and force_nodemap
                         and parse_index_v1_nodemap is not None
                     )
                     use_rust_index = False
                     if rustrevlog is not None:
                         # note: both branches below enable the Rust index
                         if self._nodemap_file is not None:
                             use_rust_index = True
                         else:
                             # Using the CIndex is no longer possible, as the
                             # `AncestorsIterator` and `LazyAncestors` classes now require
                             # a Rust index for instantiation.
                             use_rust_index = True
                     # Pick the parser: v1 by default, overridden by format version
                     # first, then by the devel nodemap and Rust index choices.
                     self._parse_index = parse_index_v1
                     if self._format_version == REVLOGV0:
                         self._parse_index = revlogv0.parse_index_v0
                     elif self._format_version == REVLOGV2:
                         self._parse_index = parse_index_v2
                     elif self._format_version == CHANGELOGV2:
                         self._parse_index = parse_index_cl_v2
                     elif devel_nodemap:
                         self._parse_index = parse_index_v1_nodemap
                     elif use_rust_index:
                         self._parse_index = functools.partial(
                             parse_index_v1_rust, default_header=new_header
                         )
                     try:
                         d = self._parse_index(index_data, self._inline)
                         index, chunkcache = d
                         use_nodemap = (
                             not self._inline
                             and self._nodemap_file is not None
                             and hasattr(index, 'update_nodemap_data')
                         )
                         if use_nodemap:
                             nodemap_data = nodemaputil.persisted_data(self)
                             if nodemap_data is not None:
                                 docket = nodemap_data[0]
                                 # only trust the persisted nodemap when its recorded tip
                                 # still matches the index
                                 if (
                                     len(d[0]) > docket.tip_rev
                                     and d[0][docket.tip_rev][7] == docket.tip_node
                                 ):
                                     # no changelog tampering
                                     self._nodemap_docket = docket
                                     index.update_nodemap_data(*nodemap_data)
                     except (ValueError, IndexError):
                         raise error.RevlogError(
                             _(b"index %s is corrupted") % self.display_id
                         )
                     self.index = index
                     # revnum -> (chain-length, sum-delta-length)
                     self._chaininfocache = util.lrucachedict(500)
                     return chunkcache
                 def _load_inner(self, chunk_cache):
                     """Build ``self._inner`` from the state set up by index loading.

                     The default compression header comes from the docket when there is
                     one, and is ``None`` otherwise.
                     """
                     docket = self._docket
                     compression_header = (
                         None if docket is None else docket.default_compression_header
                     )
                     self._inner = _InnerRevlog(
                         opener=self.opener,
                         index=self.index,
                         index_file=self._indexfile,
                         data_file=self._datafile,
                         sidedata_file=self._sidedatafile,
                         inline=self._inline,
                         data_config=self.data_config,
                         delta_config=self.delta_config,
                         feature_config=self.feature_config,
                         chunk_cache=chunk_cache,
                         default_compression_header=compression_header,
                     )
                 def get_revlog(self):
                     """Return this object itself.

                     Exists to mirror the API of other, not-really-revlog, objects.
                     """
                     revlog_object = self
                     return revlog_object
                 @util.propertycache
                 def revlog_kind(self):
                     """The KIND part (first item) of ``self.target``."""
                     kind = self.target[0]
                     return kind
                 @util.propertycache
                 def display_id(self):
                     """The public facing "ID" of the revlog that we use in messages."""
                     if self.revlog_kind != KIND_FILELOG:
                         return self.radix
                     # Reference the file without the "data/" prefix, so it is familiar
                     # to the user.
                     return self.target[1]
                 def _datafp(self, mode=b'r'):
                     """file object for the revlog's data file"""
                     return self.opener(self._datafile, mode=mode)
                 def tiprev(self):
                     """Return the number of the last revision (-1 for an empty index)."""
                     revision_count = len(self.index)
                     return revision_count - 1
                 def tip(self):
                     """Return the node of the last revision, as given by ``tiprev()``."""
                     last_rev = self.tiprev()
                     return self.node(last_rev)
                 def __contains__(self, rev):
                     return 0 <= rev < len(self)
                 def __len__(self):
                     return len(self.index)
                 def __iter__(self):
                     return iter(range(len(self)))
                 def revs(self, start=0, stop=None):
                     """Iterate over the revisions of this revlog, from start to stop.

                     The iteration itself is delegated to ``storageutil.iterrevs``.
                     """
                     revision_count = len(self)
                     return storageutil.iterrevs(revision_count, start=start, stop=stop)
                 def hasnode(self, node):
                     """Tell whether ``node`` is known, i.e. ``rev(node)`` raises no KeyError."""
                     try:
                         self.rev(node)
                     except KeyError:
                         return False
                     else:
                         return True
                 def _candelta(self, baserev, rev):
                     """Tell whether a delta between ``baserev`` and ``rev`` is allowed.

                     Deltas are refused when either revision carries a flag handled by a
                     content-changing flag processor (ex. LFS). Such a processor can alter
                     the rawtext the delta would be based on, and two clients could have
                     the same revlog node with different flags (i.e. different rawtext
                     contents), making the delta incompatible.
                     """
                     for candidate in (baserev, rev):
                         if self.flags(candidate) & REVIDX_RAWTEXT_CHANGING_FLAGS:
                             return False
                     return True
                 def update_caches(self, transaction):
                     """Update the on-disk caches.

                     Nothing is done without a persistent nodemap file. With one, the
                     nodemap is updated right away when ``transaction`` is None;
                     otherwise the update is set up on the transaction, so it may be
                     delayed to transaction commit.
                     """
                     if self._nodemap_file is None:
                         return
                     if transaction is not None:
                         nodemaputil.setup_persistent_nodemap(transaction, self)
                     else:
                         nodemaputil.update_persistent_nodemap(self)
                 def clearcaches(self):
                     """Clear in-memory caches.

                     When a persistent nodemap is usable, its persisted data is reloaded
                     afterwards and pushed back into the index.
                     """
                     self._chainbasecache.clear()
                     self._inner.clear_cache()
                     self._pcache = {}
                     self._nodemap_docket = None
                     self.index.clearcaches()

                     # The python code is the one responsible for validating the docket, we
                     # end up having to refresh it here.
                     if (
                         self._inline
                         or self._nodemap_file is None
                         or not hasattr(self.index, 'update_nodemap_data')
                     ):
                         return
                     persisted = nodemaputil.persisted_data(self)
                     if persisted is None:
                         return
                     self._nodemap_docket = persisted[0]
                     self.index.update_nodemap_data(*persisted)
                 def rev(self, node):
                     """Return the revision number associated with a <nodeid>.

                     ``TypeError`` from the index lookup is propagated unchanged. When the
                     lookup fails with ``error.RevlogError``, ``error.WdirUnsupported`` is
                     raised for working-directory identifiers and ``error.LookupError``
                     for anything else.
                     """
                     try:
                         return self.index.rev(node)
                     except TypeError:
                         raise
                     except error.RevlogError:
                         # parsers.c radix tree lookup failed
                         constants = self.nodeconstants
                         names_wdir = (
                             node == constants.wdirid
                             or node in constants.wdirfilenodeids
                         )
                         if names_wdir:
                             raise error.WdirUnsupported
                         raise error.LookupError(node, self.display_id, _(b'no node'))
                 # Accessors for index entries.
                 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
                 # are flags.
                 def start(self, rev):
                     """Return the data offset of ``rev``: the first entry field shifted
                     right by 16 bits (dropping the flag bits)."""
                     offset_and_flags = self.index[rev][0]
                     return int(offset_and_flags >> 16)
                 def sidedata_cut_off(self, rev):
                     """Return the sidedata offset recorded for ``rev``, or a fallback.

                     A non-zero offset stored in the entry is returned directly. Otherwise
                     the index is scanned backwards from ``rev`` for the closest entry
                     with a non-zero sidedata length, and the end of that entry's sidedata
                     (offset + length) is returned; 0 when there is none.
                     """
                     index = self.index
                     recorded_offset = index[rev][8]
                     if recorded_offset != 0:
                         return recorded_offset
                     # This is some annoying dance, because entries without sidedata
                     # currently use 0 as their offset. (instead of previous-offset +
                     # previous-size)
                     #
                     # We should reconsider this sidedata → 0 sidedata_offset policy.
                     # In the meantime, we need this.
                     for candidate in range(rev, -1, -1):
                         entry = index[candidate]
                         if entry[9] != 0:
                             return entry[8] + entry[9]
                     return 0
                 def flags(self, rev):
                     """Return the flags of ``rev``: the low 16 bits of the first entry field."""
                     offset_and_flags = self.index[rev][0]
                     return offset_and_flags & 0xFFFF
                 def length(self, rev):
                     """Return the second field of the index entry for ``rev``, which
                     ``end()`` adds to ``start()`` to find where the revision's data stops."""
                     entry = self.index[rev]
                     return entry[1]
                 def sidedata_length(self, rev):
                     """Return the sidedata length stored for ``rev``.

                     Always 0 when the revlog has no sidedata support.
                     """
                     if self.feature_config.has_side_data:
                         return self.index[rev][9]
                     return 0
                 def rawsize(self, rev):
                     """Return the length of the uncompressed text for a given revision.

                     The value stored in the index is used when it is not negative;
                     otherwise the raw data is fetched and measured.
                     """
                     stored_size = self.index[rev][2]
                     if stored_size < 0:
                         return len(self.rawdata(rev))
                     return stored_size
                 def size(self, rev):
                     """Return the length of the non-raw text of ``rev``.

                     The non-raw text is the one processed by a "read" flag processor.
                     """
                     # Every known flag except ELLIPSIS, which is known not to change
                     # the content.
                     content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
                     if self.flags(rev) & content_changing:
                         return len(self.revision(rev))
                     # fast path: no "read" flag processor could change the content, so
                     # size is rawsize.
                     return self.rawsize(rev)
                 def fast_rank(self, rev):
                     """Return the rank of a revision if already known, or None otherwise.

                     The rank of a revision is the size of the sub-graph it defines as a
                     head. Equivalently, the rank of a revision `r` is the size of the set
                     `ancestors(r)`, `r` included.

                     This method returns the rank retrieved from the revlog in constant
                     time. It makes no attempt at computing unknown values for versions of
                     the revlog which do not persist the rank.
                     """
                     stored_rank = self.index[rev][ENTRY_RANK]
                     rank_is_known = (
                         self._format_version == CHANGELOGV2
                         and stored_rank != RANK_UNKNOWN
                     )
                     if not rank_is_known:
                         return None
                     # the null revision has rank 0 by convention
                     return 0 if rev == nullrev else stored_rank
                 def chainbase(self, rev):
                     """Return the base revision of the chain ``rev`` belongs to.

                     The chain is followed through entry field 3 until an entry points at
                     itself. The result is cached per revision.
                     """
                     cache = self._chainbasecache
                     cached = cache.get(rev)
                     if cached is not None:
                         return cached
                     index = self.index
                     current = rev
                     base = index[current][3]
                     while base != current:
                         current = base
                         base = index[current][3]
                     cache[rev] = base
                     return base
                 def linkrev(self, rev):
                     """Return the linkrev of ``rev`` (field 4 of its index entry)."""
                     entry = self.index[rev]
                     return entry[4]
                 def parentrevs(self, rev):
                     """Return the ``(p1, p2)`` parent revisions of ``rev``.

                     With canonical parent order enabled, a null first parent is moved to
                     the second position. An out-of-range ``rev`` raises
                     ``error.WdirUnsupported`` when it is the working-directory revision
                     and ``IndexError`` otherwise.
                     """
                     try:
                         entry = self.index[rev]
                     except IndexError:
                         if rev != wdirrev:
                             raise
                         raise error.WdirUnsupported
                     first, second = entry[5], entry[6]
                     if self.feature_config.canonical_parent_order and first == nullrev:
                         return second, first
                     return first, second
                 # Fast parentrevs(rev) for callers that know rev isn't filtered.
                 # This name is bound to the parentrevs function defined just above, so
                 # it keeps pointing at that implementation even if parentrevs is later
                 # overridden (presumably by filtering subclasses; verify against them).
                 _uncheckedparentrevs = parentrevs
                 def node(self, rev):
                     """Return the node id stored in field 7 of the index entry of ``rev``.
                     Raises error.WdirUnsupported when the lookup fails for wdirrev; any
                     other IndexError is propagated unchanged.
                     """
                     try:
                         entry = self.index[rev]
                         nodeid = entry[7]
                     except IndexError:
                         if rev != wdirrev:
                             raise
                         raise error.WdirUnsupported
                     return nodeid
                 # Derived from index values.
                 def end(self, rev):
                     """Return ``self.start(rev) + self.length(rev)``."""
                     offset = self.start(rev)
                     size = self.length(rev)
                     return offset + size
                 def parents(self, node):
                     """Return the parent node ids of ``node`` as a ``(p1, p2)`` tuple.
                     The parent revisions are read from fields 5 and 6 of the index
                     entry and resolved to node ids through field 7 of the parents'
                     own entries. When ``feature_config.canonical_parent_order`` is set
                     and the first parent is the null node, the pair is returned
                     swapped, which is the same ordering rule parentrevs() applies to
                     revision numbers.
                     """
                     i = self.index
                     d = i[self.rev(node)]
                     # inline node() to avoid function call overhead
                     p1 = i[d[5]][7]
                     p2 = i[d[6]][7]
                     # d[5] is a revision number, so comparing it to the binary
                     # self.nullid could never match; compare the resolved node id.
                     if self.feature_config.canonical_parent_order and p1 == self.nullid:
                         return p2, p1
                     return p1, p2
                 def chainlen(self, rev):
                     """Return the first item of ``self._chaininfo(rev)``: the chain length."""
                     info = self._chaininfo(rev)
                     return info[0]
                 def _chaininfo(self, rev):
                     chaininfocache = self._chaininfocache
                     if rev in chaininfocache:
                         return chaininfocache[rev]
                     index = self.index
                     generaldelta = self.delta_config.general_delta
                     iterrev = rev
                     e = index[iterrev]
                     clen = 0
                     compresseddeltalen = 0
                     while iterrev != e[3]:
                         clen += 1
                         compresseddeltalen += e[1]
                         if generaldelta:
                             iterrev = e[3]
                         else:
                             iterrev -= 1
                         if iterrev in chaininfocache:
                             t = chaininfocache[iterrev]
                             clen += t[0]
                             compresseddeltalen += t[1]
                             break
                         e = index[iterrev]
                     else:
                         # Add text length of base since decompressing that also takes
                         # work. For cache hits the length is already included.
                         compresseddeltalen += e[1]
                     r = (clen, compresseddeltalen)
                     chaininfocache[rev] = r
                     return r
                 def _deltachain(self, rev, stoprev=None):
                     return self._inner._deltachain(rev, stoprev=stoprev)
                 def ancestors(self, revs, stoprev=0, inclusive=False):
                     """Generate the ancestors of 'revs' in reverse revision order.
                     Does not generate revs lower than stoprev.
                     See the documentation for ancestor.lazyancestors for more details."""
                     revs = list(revs)
                     # looking up the node of every start revision makes sure none of
                     # them is filtered
                     for startrev in revs:
                         self.node(startrev)
                     # and we're sure ancestors aren't filtered as well
                     use_rust = rustancestor is not None and self.index.rust_ext_compat
                     if use_rust:
                         return rustancestor.LazyAncestors(
                             self.index, revs, stoprev=stoprev, inclusive=inclusive
                         )
                     return ancestor.lazyancestors(
                         self._uncheckedparentrevs,
                         revs,
                         stoprev=stoprev,
                         inclusive=inclusive,
                     )
                 def descendants(self, revs):
                     """Return ``dagop.descendantrevs`` applied to ``revs``.
                     The helper is given this revlog's ``revs`` and ``parentrevs``
                     methods to walk the graph.
                     """
                     revsfn = self.revs
                     parentrevsfn = self.parentrevs
                     return dagop.descendantrevs(revs, revsfn, parentrevsfn)
                 def findcommonmissing(self, common=None, heads=None):
                     """Return a tuple of the ancestors of common and the ancestors of heads
                     that are not ancestors of common. In revset terminology, we return the
                     tuple:
                       ::common, (::heads) - (::common)
                     The first item is a set-like object of revision numbers; the second
                     is a list of node IDs sorted by revision number, meaning it is
                     topologically sorted.
                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()
                     common = [self.rev(n) for n in common]
                     heads = [self.rev(n) for n in heads]
                     # we want the ancestors, but inclusive
                     class lazyset:
                         """Set-like view: explicitly added values plus a lazy iterable."""
                         def __init__(self, lazyvalues):
                             self.addedvalues = set()
                             self.lazyvalues = lazyvalues
                         def __contains__(self, value):
                             if value in self.addedvalues:
                                 return True
                             return value in self.lazyvalues
                         def __iter__(self):
                             added = self.addedvalues
                             yield from added
                             for r in self.lazyvalues:
                                 if r not in added:
                                     yield r
                         def add(self, value):
                             self.addedvalues.add(value)
                         def update(self, values):
                             self.addedvalues.update(values)
                     has = lazyset(self.ancestors(common))
                     has.add(nullrev)
                     has.update(common)
                     # take all ancestors from heads that aren't in has
                     pending = collections.deque(r for r in heads if r not in has)
                     seen = set()
                     while pending:
                         current = pending.popleft()
                         if current in seen:
                             continue
                         seen.add(current)
                         pending.extend(
                             p for p in self.parentrevs(current) if p not in has
                         )
                     return has, [self.node(r) for r in sorted(seen)]
                 def incrementalmissingrevs(self, common=None):
                     """Return an object that can be used to incrementally compute the
                     revision numbers of the ancestors of arbitrary sets that are not
                     ancestors of common.
                     The object is a rustancestor.MissingAncestors when the Rust
                     extension is available and the index is compatible with it,
                     otherwise an ancestor.incrementalmissingancestors.
                     'common' is a list of revision numbers. If common is not supplied,
                     uses nullrev.
                     """
                     bases = [nullrev] if common is None else common
                     rust_ok = rustancestor is not None and self.index.rust_ext_compat
                     if not rust_ok:
                         return ancestor.incrementalmissingancestors(
                             self.parentrevs, bases
                         )
                     return rustancestor.MissingAncestors(self.index, bases)
                 def findmissingrevs(self, common=None, heads=None):
                     """Return the revision numbers of the ancestors of heads that
                     are not ancestors of common.
                     More specifically, return a list of revision numbers N such that
                     every N satisfies the following constraints:
                       1. N is an ancestor of some revision in 'heads'
                       2. N is not an ancestor of any revision in 'common'
                     The list is sorted by revision number, meaning it is
                     topologically sorted.
                     'heads' and 'common' are both lists of revision numbers.  If heads
                     is not supplied, uses all of the revlog's head revisions.  If
                     common is not supplied, uses nullrev."""
                     bases = [nullrev] if common is None else common
                     tips = self.headrevs() if heads is None else heads
                     tracker = self.incrementalmissingrevs(common=bases)
                     return tracker.missingancestors(tips)
                 def findmissing(self, common=None, heads=None):
                     """Return the ancestors of heads that are not ancestors of common.
                     More specifically, return a list of nodes N such that every N
                     satisfies the following constraints:
                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'
                     The list is sorted by revision number, meaning it is
                     topologically sorted.
                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()
                     # the incremental helper works on revision numbers
                     commonrevs = list(map(self.rev, common))
                     headrevs = list(map(self.rev, heads))
                     tracker = self.incrementalmissingrevs(common=commonrevs)
                     return list(map(self.node, tracker.missingancestors(headrevs)))
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a topological path from 'roots' to 'heads'.
                     Return a tuple (nodes, outroots, outheads) where 'nodes' is a
                     topologically sorted list of all nodes N that satisfy both of
                     these constraints:
                       1. N is a descendant of some node in 'roots'
                       2. N is an ancestor of some node in 'heads'
                     Every node is considered to be both a descendant and an ancestor
                     of itself, so every reachable node in 'roots' and 'heads' will be
                     included in 'nodes'.
                     'outroots' is the list of reachable nodes in 'roots', i.e., the
                     subset of 'roots' that is returned in 'nodes'.  Likewise,
                     'outheads' is the subset of 'heads' that is also in 'nodes'.
                     'roots' and 'heads' are both lists of node IDs.  If 'roots' is
                     unspecified, uses nullid as the only root.  If 'heads' is
                     unspecified, uses list of all of the revlog's heads.
                     Three empty lists are returned when 'roots' or 'heads' is given
                     but empty, or when no root turns out to be an ancestor of the
                     requested heads."""
                     # Result returned whenever nothing can match.
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [self.nullid]  # Everybody's a descendant of nullid
                         lowestrev = nullrev
                     if (lowestrev == nullrev) and (heads is None):
                         # We want _all_ the nodes!
                         return (
                             [self.node(r) for r in self],
                             [self.nullid],
                             list(self.heads()),
                         )
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = len(self) - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = set()
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, False)
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = set(heads)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == self.nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendant of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors.add(n)  # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.update(
                                         [p for p in self.parents(n) if p != self.nullid]
                                     )
                                 elif n in heads:  # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > nullrev:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [root for root in roots if root in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(root) for root in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = nullrev
                             roots = [self.nullid]
                     # Transform our roots list into a set.
                     descendants = set(roots)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendants.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descendants, empty parents will look like
                     # they're descendants.
                     for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
                         n = self.node(r)
                         isdescendant = False
                         if lowestrev == nullrev:  # Everybody is a descendant of nullid
                             isdescendant = True
                         elif n in descendants:
                             # n is already a descendant
                             isdescendant = True
                             # This check only needs to be done here because all the roots
                             # were already marked as descendants before the loop.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendants, it's not a root.
                                 if (p[0] in descendants) or (p[1] in descendants):
                                     roots.remove(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendant if either of its parents are
                             # descendants.  (We seeded the descendants set with the
                             # roots up there, remember?)
                             if (p[0] in descendants) or (p[1] in descendants):
                                 descendants.add(n)
                                 isdescendant = True
                         if isdescendant and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendants and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = True
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = True
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     # Keep only the heads that were actually reached from the roots.
                     heads = [head for head, flag in heads.items() if flag]
                     roots = list(roots)
                     # NOTE(review): these sanity checks are plain asserts, so they are
                     # skipped when Python runs with -O.
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def headrevs(self, revs=None):
                     """Return the head revisions, optionally restricted to ``revs``.
                     Without ``revs`` the index's own ``headrevs()`` is used, falling
                     back to ``self._headrevs()`` when that raises AttributeError.
                     With ``revs`` the work is handed to rustdagop.headrevs when the
                     Rust extension is available and the index is compatible with it,
                     otherwise to dagop.headrevs.
                     """
                     if revs is not None:
                         if rustdagop is not None and self.index.rust_ext_compat:
                             return rustdagop.headrevs(self.index, revs)
                         return dagop.headrevs(revs, self._uncheckedparentrevs)
                     try:
                         found = self.index.headrevs()
                     except AttributeError:
                         found = self._headrevs()
                     return found
                 def computephases(self, roots):
                     """Return ``self.index.computephasesmapsets(roots)``."""
                     index = self.index
                     return index.computephasesmapsets(roots)
                 def _headrevs(self):
                     count = len(self)
                     if not count:
                         return [nullrev]
                     # we won't iter over filtered rev so nobody is a head at start
                     ishead = [0] * (count + 1)
                     index = self.index
                     for r in self:
                         ishead[r] = 1  # I may be an head
                         e = index[r]
                         ishead[e[5]] = ishead[e[6]] = 0  # my parent are not
                     return [r for r, val in enumerate(ishead) if val]
                 def _head_node_ids(self):
                     try:
                         return self.index.head_node_ids()
                     except AttributeError:
                         return [self.node(r) for r in self.headrevs()]
                 def heads(self, start=None, stop=None):
                     """return the list of all nodes that have no children
                     if start is specified, only heads that are descendants of
                     start will be returned
                     if stop is specified, it will consider all the revs from stop
                     as if they had no children
                     With neither argument, an empty revlog yields ``[self.nullid]``.
                     """
                     if start is None and stop is None:
                         return self._head_node_ids() if len(self) else [self.nullid]
                     startrev = nullrev if start is None else self.rev(start)
                     stoprevs = set(map(self.rev, stop or []))
                     subset = dagop.headrevssubset(
                         self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
                     )
                     return [self.node(r) for r in subset]
                 def children(self, node):
                     """find the children of a given node
                     Only revisions after the one of ``node`` are scanned. A revision
                     with no non-null parent counts as a child only when ``node`` is
                     the null revision.
                     """
                     target = self.rev(node)
                     found = []
                     for rev in self.revs(start=target + 1):
                         realparents = [
                             pr for pr in self.parentrevs(rev) if pr != nullrev
                         ]
                         if not realparents:
                             if target == nullrev:
                                 found.append(self.node(rev))
                             continue
                         for pr in realparents:
                             if pr == target:
                                 found.append(self.node(rev))
                     return found
                 def commonancestorsheads(self, a, b):
                     """calculate all the heads of the common ancestors of nodes a and b
                     Both nodes are turned into revisions, and the resulting revisions
                     are mapped back to nodes."""
                     reva = self.rev(a)
                     revb = self.rev(b)
                     headrevs = self._commonancestorsheads(reva, revb)
                     return pycompat.maplist(self.node, headrevs)
                 def _commonancestorsheads(self, *revs):
                     """calculate all the heads of the common ancestors of revs"""
                     try:
                         ancs = self.index.commonancestorsheads(*revs)
                     except (AttributeError, OverflowError):  # C implementation failed
                         ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
                     return ancs
                 def isancestor(self, a, b):
                     """return True if node a is an ancestor of node b
                     A revision is considered an ancestor of itself.
                     Both nodes are turned into revisions and passed to isancestorrev."""
                     reva = self.rev(a)
                     revb = self.rev(b)
                     return self.isancestorrev(reva, revb)
                 def isancestorrev(self, a, b):
                     """return True if revision a is an ancestor of revision b
                     A revision is considered an ancestor of itself.
                     nullrev is an ancestor of everything, and a revision greater than
                     b is never its ancestor. The remaining cases are decided by
                     reachableroots."""
                     if a == nullrev or a == b:
                         return True
                     if a > b:
                         return False
                     reached = self.reachableroots(a, [b], [a], includepath=False)
                     return bool(reached)
                 def reachableroots(self, minroot, heads, roots, includepath=False):
                     """return (heads(::(<roots> and <roots>::<heads>)))
                     If includepath is True, return (<roots>::<heads>).
                     The index's ``reachableroots2`` is tried first; on AttributeError
                     ``dagop._reachablerootspure`` is used instead."""
                     try:
                         result = self.index.reachableroots2(
                             minroot, heads, roots, includepath
                         )
                     except AttributeError:
                         result = dagop._reachablerootspure(
                             self.parentrevs, minroot, roots, heads, includepath
                         )
                     return result
                 def ancestor(self, a, b):
                     """calculate the "best" common ancestor of nodes a and b
                     Candidates come from the index's ``ancestors`` or, on
                     AttributeError or OverflowError, from the ``ancestor`` module.
                     The smallest candidate node is returned, and nullid when there is
                     no candidate."""
                     reva = self.rev(a)
                     revb = self.rev(b)
                     try:
                         candidates = self.index.ancestors(reva, revb)
                     except (AttributeError, OverflowError):
                         candidates = ancestor.ancestors(self.parentrevs, reva, revb)
                     if not candidates:
                         return self.nullid
                     # choose a consistent winner when there's a tie
                     return min(self.node(r) for r in candidates)
                 def _match(self, id):
                     if isinstance(id, int):
                         # rev
                         return self.node(id)
                     if len(id) == self.nodeconstants.nodelen:
                         # possibly a binary node
                         # odds of a binary node being all hex in ASCII are 1 in 10**25
                         try:
                             node = id
                             self.rev(node)  # quick search the index
                             return node
                         except error.LookupError:
                             pass  # may be partial hex id
                     try:
                         # str(rev)
                         rev = int(id)
                         if b"%d" % rev != id:
                             raise ValueError
                         if rev < 0:
                             rev = len(self) + rev
                         if rev < 0 or rev >= len(self):
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         pass
                     if len(id) == 2 * self.nodeconstants.nodelen:
                         try:
                             # a full hex nodeid?
                             node = bin(id)
                             self.rev(node)
                             return node
                         except (binascii.Error, error.LookupError):
                             pass
                 def _partialmatch(self, id):
                     """Resolve the hex prefix ``id`` to a node.
                     Returns the matching node, or None when nothing matches. Raises
                     error.AmbiguousPrefixLookupError when the prefix is ambiguous, and
                     error.WdirUnsupported when it only identifies the working
                     directory pseudo-node. Unambiguous results of the slow path are
                     remembered in ``self._pcache``.
                     """
                     # we don't care wdirfilenodeids as they should be always full hash
                     maybewdir = self.nodeconstants.wdirhex.startswith(id)
                     ambiguous = False
                     try:
                         # fast path: ask the index
                         partial = self.index.partialmatch(id)
                         if partial and self.hasnode(partial):
                             if maybewdir:
                                 # single 'ff...' match in radix tree, ambiguous with wdir
                                 ambiguous = True
                             else:
                                 return partial
                         elif maybewdir:
                             # no 'ff...' match in radix tree, wdir identified
                             raise error.WdirUnsupported
                         else:
                             return None
                     except error.RevlogError:
                         # parsers.c radix tree lookup gave multiple matches
                         # fast path: for unfiltered changelog, radix tree is accurate
                         if not getattr(self, 'filteredrevs', None):
                             ambiguous = True
                         # fall through to slow path that filters hidden revisions
                     except (AttributeError, ValueError):
                         # we are pure python, or key is not hex
                         pass
                     if ambiguous:
                         raise error.AmbiguousPrefixLookupError(
                             id, self.display_id, _(b'ambiguous identifier')
                         )
                     # slow path: consult the prefix cache, then scan the whole index
                     if id in self._pcache:
                         return self._pcache[id]
                     # NOTE(review): 40 looks like the hex length of a sha1 node; confirm
                     # whether it should follow self.nodeconstants.nodelen. Longer ids
                     # fall off the end of this method and yield None.
                     if len(id) <= 40:
                         # hex(node)[:...]
                         l = len(id) // 2 * 2  # grab an even number of digits
                         try:
                             # we're dropping the last digit, so let's check that it's hex,
                             # to avoid the expensive computation below if it's not
                             if len(id) % 2 > 0:
                                 if not (id[-1] in hexdigits):
                                     return None
                             prefix = bin(id[:l])
                         except binascii.Error:
                             # not hex: nothing can match, None is returned implicitly
                             pass
                         else:
                             # filter on the binary prefix first, then refine with the
                             # full hex prefix and drop nodes hasnode() rejects
                             nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                             nl = [
                                 n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                             ]
                             if self.nodeconstants.nullhex.startswith(id):
                                 nl.append(self.nullid)
                             if len(nl) > 0:
                                 if len(nl) == 1 and not maybewdir:
                                     self._pcache[id] = nl[0]
                                     return nl[0]
                                 raise error.AmbiguousPrefixLookupError(
                                     id, self.display_id, _(b'ambiguous identifier')
                                 )
                             if maybewdir:
                                 raise error.WdirUnsupported
                             return None
                 def lookup(self, id):
                     """locate a node based on:
                     - revision number or str(revision number)
                     - nodeid or subset of hex nodeid
                     An exact match is tried before a prefix match. Raises
                     error.LookupError when neither finds anything.
                     """
                     exact = self._match(id)
                     if exact is not None:
                         return exact
                     partial = self._partialmatch(id)
                     if not partial:
                         raise error.LookupError(
                             id, self.display_id, _(b'no match found')
                         )
                     return partial
                 def shortest(self, node, minlength=1):
                     """Find the shortest unambiguous prefix that matches node.
                     The prefix is at least ``minlength`` hex digits long. Prefixes made
                     only of 'f' digits are lengthened so they cannot be mistaken for
                     the working directory id. Raises error.LookupError when the node
                     is not found.
                     """
                     def isvalid(prefix):
                         """Tell whether ``prefix`` is an unambiguous prefix."""
                         try:
                             matchednode = self._partialmatch(prefix)
                         except error.AmbiguousPrefixLookupError:
                             return False
                         except error.WdirUnsupported:
                             # single 'ff...' match
                             return True
                         if matchednode is None:
                             raise error.LookupError(node, self.display_id, _(b'no node'))
                         return True
                     def maybewdir(prefix):
                         """Tell whether ``prefix`` consists only of 'f' digits."""
                         return all(c == b'f' for c in pycompat.iterbytestr(prefix))
                     hexnode = hex(node)
                     def disambiguate(hexnode, minlength):
                         """Disambiguate against wdirid.
                         Return the shortest prefix of at least ``minlength`` digits
                         that is not made only of 'f' digits."""
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if not maybewdir(prefix):
                                 return prefix
                     # fast path: when no revision is filtered, ask the index directly
                     if not getattr(self, 'filteredrevs', None):
                         try:
                             length = max(self.index.shortest(node), minlength)
                             return disambiguate(hexnode, length)
                         except error.RevlogError:
                             # for wdirid, fall through to the pure code below
                             if node != self.nodeconstants.wdirid:
                                 raise error.LookupError(
                                     node, self.display_id, _(b'no node')
                                 )
                         except AttributeError:
                             # Fall through to pure code
                             pass
                     # wdirid itself: the first valid prefix is returned as is, without
                     # the 'f'-only disambiguation
                     if node == self.nodeconstants.wdirid:
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if isvalid(prefix):
                                 return prefix
                     # pure code: grow the prefix until it is unambiguous
                     for length in range(minlength, len(hexnode) + 1):
                         prefix = hexnode[:length]
                         if isvalid(prefix):
                             return disambiguate(hexnode, length)
                 def cmp(self, node, text):
                     """Tell whether ``text`` differs from the stored revision ``node``.

                     The hash of ``text`` combined with the parents of ``node`` is
                     recomputed with ``storageutil.hashrevisionsha1``; the result is
                     True when that hash is not equal to ``node``.
                     """
                     first_parent, second_parent = self.parents(node)
                     recomputed = storageutil.hashrevisionsha1(
                         text, first_parent, second_parent
                     )
                     return recomputed != node
                 def deltaparent(self, rev):
                     """Return the revision that ``rev`` is stored as a delta against.

                     ``nullrev`` is returned when the index entry names ``rev`` itself
                     as its base. Otherwise the recorded base is returned when
                     general delta is enabled, and ``rev - 1`` when it is not.
                     """
                     recorded_base = self.index[rev][3]
                     if recorded_base == rev:
                         return nullrev
                     if self.delta_config.general_delta:
                         return recorded_base
                     return rev - 1
                 def issnapshot(self, rev):
                     """Tell whether ``rev`` is a snapshot.

                     The answer comes from ``self._inner.issnapshot``. After the first
                     successful call the inner method is installed directly on this
                     instance, so later calls bypass this wrapper.
                     """
                     answer = self._inner.issnapshot(rev)
                     # shadow this method with the inner one for subsequent calls
                     setattr(self, 'issnapshot', self._inner.issnapshot)
                     return answer
                 def snapshotdepth(self, rev):
                     """Return the number of snapshots in the chain before ``rev``.

                     ``rev`` must itself be a snapshot; the depth is the length of
                     its delta chain (as reported by ``self._inner._deltachain``)
                     minus one.

                     Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
                     """
                     if not self.issnapshot(rev):
                         # interpolate the revision number: the message used to be
                         # raised with a literal, unformatted ``%d``
                         raise error.ProgrammingError(
                             b'revision %d not a snapshot' % rev
                         )
                     return len(self._inner._deltachain(rev)[0]) - 1
                 def revdiff(self, rev1, rev2):
                     """Return a binary delta turning revision ``rev1`` into ``rev2``.

                     The delta is meant to be written to revlog data directly, so it
                     is built from raw revision data. When ``rev2`` is already stored
                     as a delta against ``rev1`` the stored chunk is returned as is;
                     otherwise the delta is computed from both raw texts.
                     """
                     if rev1 == nullrev or self.deltaparent(rev2) != rev1:
                         old_raw = self.rawdata(rev1)
                         new_raw = self.rawdata(rev2)
                         return mdiff.textdiff(old_raw, new_raw)
                     stored_chunk = self._inner._chunk(rev2)
                     return bytes(stored_chunk)
                 def revision(self, nodeorrev):
                     """Return the uncompressed revision for a node or revision number.

                     This is ``_revisiondata`` called with its default (non-raw) mode.
                     """
                     text = self._revisiondata(nodeorrev)
                     return text
                 def sidedata(self, nodeorrev):
                     """Return the sidedata attached to a node or revision number.

                     Sidedata is a map of extra data related to the changeset that is
                     not part of the hash. A dictionary is returned for now; a more
                     advanced, lazier mapping object will likely replace it in the
                     future.
                     """
                     # accept either a revision number or a node
                     rev = (
                         nodeorrev
                         if isinstance(nodeorrev, int)
                         else self.rev(nodeorrev)
                     )
                     return self._sidedata(rev)
                 def _rawtext(self, node, rev):
                     """Return the possibly unvalidated rawtext of a revision.

                     The result is a ``(rev, rawtext, validated)`` tuple. A hit in the
                     inner revision cache is reported as validated; otherwise the
                     revision number is resolved if needed and the inner revlog is
                     asked for the raw text.
                     """
                     # the cache entry, when present, is (node, rev, rawtext)
                     cached = self._inner._revisioncache
                     if cached and cached[0] == node:
                         return (rev, cached[2], True)
                     resolved = self.rev(node) if rev is None else rev
                     return self._inner.raw_text(node, resolved)
                 def _revisiondata(self, nodeorrev, raw=False):
                     """Return the text (or, with ``raw=True``, the raw text) of a revision.

                     ``nodeorrev`` is either a revision number or a node. The null
                     node yields ``b""``. The stored text is run through the flag
                     processors unless it is already validated and either ``raw``
                     is set or the revision carries only the default flags.
                     """
                     # accept either a revision number or a node
                     if isinstance(nodeorrev, int):
                         rev, node = nodeorrev, self.node(nodeorrev)
                     else:
                         rev, node = None, nodeorrev

                     # fast path the special `nullid` rev
                     if node == self.nullid:
                         return b""

                     # ``stored`` is the text as kept inside the revlog. It might be
                     # the revision itself or might need processing to obtain it.
                     rev, stored, is_validated = self._rawtext(node, rev)

                     if is_validated and raw:
                         # the raw text was requested and came validated from the
                         # cache: nothing left to do
                         return stored

                     if rev is None:
                         rev = self.rev(node)

                     # the revlog's flags for this revision
                     # (they usually alter its state or content)
                     rev_flags = self.flags(rev)

                     if is_validated and rev_flags == REVIDX_DEFAULT_FLAGS:
                         # no extra flags set, no flag processor runs, text = rawtext
                         return stored

                     if raw:
                         must_check_hash = flagutil.processflagsraw(
                             self, stored, rev_flags
                         )
                         text = stored
                     else:
                         text, must_check_hash = flagutil.processflagsread(
                             self, stored, rev_flags
                         )

                     if must_check_hash:
                         self.checkhash(text, node, rev=rev)
                     if not is_validated:
                         self._inner._revisioncache = (node, rev, stored)
                     return text
                 def _sidedata(self, rev):
                     """Return the sidedata for the revision number ``rev``.

                     The docket's ``sidedata_end`` is forwarded to the inner revlog
                     when a docket exists, ``None`` otherwise.
                     """
                     docket = self._docket
                     end_of_sidedata = None if docket is None else docket.sidedata_end
                     return self._inner.sidedata(rev, end_of_sidedata)
                 def rawdata(self, nodeorrev):
                     """Return the uncompressed raw data for a node or revision number.

                     This is ``_revisiondata`` called with ``raw=True``.
                     """
                     raw_text = self._revisiondata(nodeorrev, raw=True)
                     return raw_text
                 def hash(self, text, p1, p2):
                     """Compute the node hash of ``text`` with parents ``p1`` and ``p2``.

                     Kept as a method so that subclasses can substitute another
                     hash when they need to.
                     """
                     digest = storageutil.hashrevisionsha1(text, p1, p2)
                     return digest
                 def checkhash(self, text, node, p1=None, p2=None, rev=None):
                     """Verify that ``text`` hashes to ``node``.

                     When both ``p1`` and ``p2`` are None the parents are looked up
                     from ``node``. Kept as a method so that subclasses can extend
                     the behavior on hash mismatch.

                     Raises ``error.RevlogError`` on mismatch, or
                     ``error.CensoredNodeError`` instead when the revlog is
                     censorable and ``text`` is censored text.
                     """
                     try:
                         if p1 is None and p2 is None:
                             p1, p2 = self.parents(node)
                         if node != self.hash(text, p1, p2):
                             # Drop the cached revision on hash failure. The cache
                             # only holds the raw revision, so clearing it means a
                             # later raw access will miss the cache. This should be
                             # rare, and teaching the cache about the verification
                             # state would be extra work.
                             cached = self._inner._revisioncache
                             if cached and cached[0] == node:
                                 self._inner._revisioncache = None

                             if rev is None:
                                 revornode = templatefilters.short(hex(node))
                             else:
                                 revornode = rev
                             details = (self.display_id, pycompat.bytestr(revornode))
                             raise error.RevlogError(
                                 _(b"integrity check failed on %s:%s") % details
                             )
                     except error.RevlogError:
                         is_censored = (
                             self.feature_config.censorable
                             and storageutil.iscensoredtext(text)
                         )
                         if is_censored:
                             raise error.CensoredNodeError(self.display_id, node, text)
                         raise
                 @property
                 def _split_index_file(self):
                     """Path where the index of an ongoing split operation is expected.

                     The file only exists while a split is in progress, but its
                     location is always the same: for a radix with several path
                     components, ``-s`` is appended to the first component and
                     ``.i`` to the last one; for a single-component radix, the
                     result is the radix followed by ``.i.s``.
                     """
                     first, *others = self.radix.split(b'/')
                     if not others:
                         # the revlog is stored at the root of the store (changelog
                         # or manifest), no risk of collision.
                         return self.radix + b'.i.s'
                     # mark the leading ``data/`` or ``meta/`` directory with '-s'
                     # and turn the last component into an index file name
                     others[-1] = others[-1] + b'.i'
                     return b'/'.join([first + b'-s'] + others)
-                def _enforceinlinesize(self, tr, side_write=True):
+                def _enforceinlinesize(self, tr):
                     """Check if the revlog is too big for inline and convert if so.
                     This should be called after revisions are added to the revlog. If the
                     revlog has grown too large to be an inline revlog, it will convert it
                     to use multiple index and data files.
                     ``tr`` is the transaction in which the split is recorded: the
                     index file is backed up in it, the data file and the temporary
                     split index are registered with it, and finalize/abort callbacks
                     are added to it.
                     Nothing is done when the revlog is not inline, or when it may
                     stay inline and its total size is below ``_maxinline``.
                     Raises ``error.ProgrammingError`` if an inline revlog has a docket,
                     and ``error.RevlogError`` if the index file is unknown to the
                     transaction while the revlog is not a changelog.
                     """
                     tiprev = len(self) - 1
                     # size of the data up to and including the tip revision
                     total_size = self.start(tiprev) + self.length(tiprev)
                     if not self._inline or (self._may_inline and total_size < _maxinline):
                         return
                     if self._docket is not None:
                         msg = b"inline revlog should not have a docket"
                         raise error.ProgrammingError(msg)
                     # In the common case, we enforce inline size because the revlog has
                     # been appended to. And in such case, it must have an initial offset
                     # recorded in the transaction.
                     troffset = tr.findoffset(self._inner.canonical_index_file)
                     pre_touched = troffset is not None
                     if not pre_touched and self.target[0] != KIND_CHANGELOG:
                         raise error.RevlogError(
                             _(b"%s not found in the transaction") % self._indexfile
                         )
                     tr.addbackup(self._inner.canonical_index_file, for_offset=pre_touched)
                     tr.add(self._datafile, 0)
                     new_index_file_path = None
                     # NOTE(review): the lines below that start with '-' or '+' look
                     # like unified-diff residue (the old ``if side_write:`` branch
                     # interleaved with its de-indented replacement, and the closing
                     # parenthesis of ``opener.rename(`` is absent) -- confirm which
                     # side is intended before relying on this block.
-                    if side_write:
+                    old_index_file_path = self._indexfile
-                        old_index_file_path = self._indexfile
+                    new_index_file_path = self._split_index_file
-                        new_index_file_path = self._split_index_file
+                    opener = self.opener
-                        opener = self.opener
+                    weak_self = weakref.ref(self)
-                        weak_self = weakref.ref(self)
+                    # the "split" index replace the real index when the transaction is
-                        # the "split" index replace the real index when the transaction is
+                    # finalized
-                        # finalized
+                    def finalize_callback(tr):
-                        def finalize_callback(tr):
+                        opener.rename(
-                            opener.rename(
+                            new_index_file_path,
-                                new_index_file_path,
+                            old_index_file_path,
-                                old_index_file_path,
+                            checkambig=True,
-                                checkambig=True,
+                        maybe_self = weak_self()
-                            maybe_self = weak_self()
+                        if maybe_self is not None:
-                            if maybe_self is not None:
+                            maybe_self._indexfile = old_index_file_path
-                                maybe_self._indexfile = old_index_file_path
+                            maybe_self._inner.index_file = maybe_self._indexfile
-                                maybe_self._inner.index_file = maybe_self._indexfile
+                    def abort_callback(tr):
-                        def abort_callback(tr):
+                        maybe_self = weak_self()
-                            maybe_self = weak_self()
+                        if maybe_self is not None:
-                            if maybe_self is not None:
+                            maybe_self._indexfile = old_index_file_path
-                                maybe_self._indexfile = old_index_file_path
+                            maybe_self._inner.inline = True
-                                maybe_self._inner.inline = True
+                            maybe_self._inner.index_file = old_index_file_path
-                                maybe_self._inner.index_file = old_index_file_path
+                    tr.registertmp(new_index_file_path)
-                        tr.registertmp(new_index_file_path)
+                    if self.target[1] is not None:
-                        if self.target[1] is not None:
+                        callback_id = b'000-revlog-split-%d-%s' % self.target
-                            callback_id = b'000-revlog-split-%d-%s' % self.target
+                    else:
-                        else:
+                        callback_id = b'000-revlog-split-%d' % self.target[0]
-                            callback_id = b'000-revlog-split-%d' % self.target[0]
+                    tr.addfinalize(callback_id, finalize_callback)
-                        tr.addfinalize(callback_id, finalize_callback)
+                    tr.addabort(callback_id, abort_callback)
-                        tr.addabort(callback_id, abort_callback)
                     # clear the inline flag before asking the inner revlog to split
                     self._format_flags &= ~FLAG_INLINE_DATA
                     self._inner.split_inline(
                         tr,
                         self._format_flags | self._format_version,
                         new_index_file_path=new_index_file_path,
                     )
                     self._inline = False
                     if new_index_file_path is not None:
                         # keep pointing at the split index until a transaction
                         # callback restores the original path
                         self._indexfile = new_index_file_path
                     nodemaputil.setup_persistent_nodemap(tr, self)
                 def _nodeduplicatecallback(self, transaction, node):
                     """Hook invoked when an attempt is made to add an already stored node.

                     This implementation does nothing.
                     """
                     return None
                 @contextlib.contextmanager
                 def reading(self):
                     """Context manager that holds the inner revlog's reading context."""
                     inner_context = self._inner.reading()
                     with inner_context:
                         yield
                 @contextlib.contextmanager
                 def _writing(self, transaction):
                     """Context manager inside which revisions may be written.

                     If the inner revlog is already writing, the body runs as is.
                     Otherwise the inner writing context is opened (seeded with the
                     docket's ``data_end`` and ``sidedata_end`` when a docket
                     exists), and the docket, if any, is written once the body
                     completes.

                     Raises ``error.ProgrammingError`` for a ``trypending`` revlog.
                     """
                     if self._trypending:
                         msg = b'try to write in a `trypending` revlog: %s' % (
                             self.display_id
                         )
                         raise error.ProgrammingError(msg)
                     if self._inner.is_writing:
                         # a writing context is already open: reuse it
                         yield
                         return
                     data_end = sidedata_end = None
                     if self._docket is not None:
                         data_end = self._docket.data_end
                         sidedata_end = self._docket.sidedata_end
                     inner_context = self._inner.writing(
                         transaction,
                         data_end=data_end,
                         sidedata_end=sidedata_end,
                     )
                     with inner_context:
                         yield
                         if self._docket is not None:
                             self._write_docket(transaction)
                 @property
                 def is_delaying(self):
                     """Mirror of ``self._inner.is_delaying``."""
                     delaying = self._inner.is_delaying
                     return delaying
                 def _write_docket(self, transaction):
                     """Write the current docket to disk within ``transaction``.

                     This exists as a method so the changelog can implement its
                     transaction logic. The same logic could conceivably be used
                     for every revlog, since dockets are cheap.
                     """
                     docket = self._docket
                     docket.write(transaction)
                 def addrevision(
                     self,
                     text,
                     transaction,
                     link,
                     p1,
                     p2,
                     cachedelta=None,
                     node=None,
                     flags=REVIDX_DEFAULT_FLAGS,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a revision to the log and return its revision number.

                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     cachedelta - an optional precomputed delta
                     node - nodeid of revision; usually left unset and computed as
                         hash(text, p1, p2), but subclasses may use another hashing
                         method (and override checkhash() in that case)
                     flags - the known flags to set on the revision
                     deltacomputer - an optional deltacomputer instance shared between
                         multiple calls
                     sidedata - optional sidedata mapping; only accepted when the
                         revlog supports sidedata

                     If the node is already stored, its existing revision number is
                     returned and nothing is written.
                     """
                     if link == nullrev:
                         raise error.RevlogError(
                             _(b"attempted to add linkrev -1 to %s") % self.display_id
                         )

                     if sidedata is None:
                         sidedata = {}
                     elif sidedata and not self.feature_config.has_side_data:
                         raise error.ProgrammingError(
                             _(b"trying to add sidedata to a revlog who don't support them")
                         )

                     if flags and not node:
                         node = self.hash(text, p1, p2)

                     rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

                     # A flag processor that rewrote the revision data invalidates
                     # whatever cachedelta was handed in.
                     if rawtext != text:
                         cachedelta = None

                     rawsize = len(rawtext)
                     if rawsize > _maxentrysize:
                         raise error.RevlogError(
                             _(
                                 b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                             )
                             % (self.display_id, rawsize)
                         )

                     if not node:
                         node = self.hash(rawtext, p1, p2)

                     known_rev = self.index.get_rev(node)
                     if known_rev is not None:
                         return known_rev

                     if validatehash:
                         self.checkhash(rawtext, node, p1=p1, p2=p2)

                     return self.addrawrevision(
                         rawtext,
                         transaction,
                         link,
                         p1,
                         p2,
                         node,
                         flags,
                         cachedelta=cachedelta,
                         deltacomputer=deltacomputer,
                         sidedata=sidedata,
                     )
                 def addrawrevision(
                     self,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     node,
                     flags,
                     cachedelta=None,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a raw revision whose flags, node and parents are known.

                     Useful when reusing a revision that is not stored in this revlog
                     (e.g. received over the wire, or read from an external bundle).
                     The revision is added inside a ``_writing`` context and the
                     value returned by ``_addrevision`` is passed through.
                     """
                     with self._writing(transaction):
                         added = self._addrevision(
                             node,
                             rawtext,
                             transaction,
                             link,
                             p1,
                             p2,
                             flags,
                             cachedelta,
                             deltacomputer=deltacomputer,
                             sidedata=sidedata,
                         )
                         return added
                 def compress(self, data):
                     """Compress ``data`` by delegating to ``self._inner.compress``."""
                     compressed = self._inner.compress(data)
                     return compressed
                 def decompress(self, data):
                     """Decompress ``data`` by delegating to ``self._inner.decompress``."""
                     restored = self._inner.decompress(data)
                     return restored
                 def _addrevision(
                     self,
                     node,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     flags,
                     cachedelta,
                     alwayscache=False,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """internal function to add revisions to the log
                     see addrevision for argument descriptions.
                     note: "addrevision" takes non-raw text, "_addrevision" takes raw text.
                     if "deltacomputer" is not provided or None, a defaultdeltacomputer will
                     be used.
                     if "alwayscache" is set and no rawtext was supplied, the text is
                     rebuilt through the deltacomputer so it can be cached.
                     returns the revision number of the new entry (the length of the
                     revlog before the entry was appended).
                     raises RevlogError when asked to add the null or a wdir node, and
                     ProgrammingError when called outside a `revlog._writing` context.
                     invariants:
                     - rawtext is optional (can be None); if not set, cachedelta must be set.
                       if both are set, they must correspond to each other.
                     """
                     if node == self.nullid:
                         raise error.RevlogError(
                             _(b"%s: attempt to add null revision") % self.display_id
                         )
                     if (
                         node == self.nodeconstants.wdirid
                         or node in self.nodeconstants.wdirfilenodeids
                     ):
                         raise error.RevlogError(
                             _(b"%s: attempt to add wdir revision") % self.display_id
                         )
                     if self._inner._writinghandles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     # the raw text travels in a one-element list; it is read back
                     # from ``btext[0]`` once the entry has been written
                     btext = [rawtext]
                     # the new revision takes the next free revision number
                     curr = len(self)
                     prev = curr - 1
                     offset = self._get_data_offset(prev)
                     if self._concurrencychecker:
                         ifh, dfh, sdfh = self._inner._writinghandles
                         # XXX no checking for the sidedata file
                         if self._inline:
                             # offset is "as if" it were in the .d file, so we need to add on
                             # the size of the entry metadata.
                             self._concurrencychecker(
                                 ifh, self._indexfile, offset + curr * self.index.entry_size
                             )
                         else:
                             # Entries in the .i are a consistent size.
                             self._concurrencychecker(
                                 ifh, self._indexfile, curr * self.index.entry_size
                             )
                             self._concurrencychecker(dfh, self._datafile, offset)
                     p1r, p2r = self.rev(p1), self.rev(p2)
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if rawtext is None:
                         # need rawtext size, before changed by flag processors, which is
                         # the non-raw size. use revlog explicitly to avoid filelog's extra
                         # logic that might remove metadata size.
                         textlen = mdiff.patchedsize(
                             revlog.size(self, cachedelta[0]), cachedelta[1]
                         )
                     else:
                         textlen = len(rawtext)
                     if deltacomputer is None:
                         # build a default delta computer, with debug output routed
                         # to the transaction when delta debugging is enabled
                         write_debug = None
                         if self.delta_config.debug_delta:
                             write_debug = transaction._report
                         deltacomputer = deltautil.deltacomputer(
                             self, write_debug=write_debug
                         )
                     if cachedelta is not None and len(cachedelta) == 2:
                         # If the cached delta has no information about how it should be
                         # reused, add the default reuse instruction according to the
                         # revlog's configuration.
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse = DELTA_BASE_REUSE_NO
                         cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)
                     revinfo = revlogutils.revisioninfo(
                         node,
                         p1,
                         p2,
                         btext,
                         textlen,
                         cachedelta,
                         flags,
                     )
                     deltainfo = deltacomputer.finddeltainfo(revinfo)
                     # without a docket the compression mode stays inline; with one,
                     # it is chosen from the docket's default compression header
                     compression_mode = COMP_MODE_INLINE
                     if self._docket is not None:
                         default_comp = self._docket.default_compression_header
                         r = deltautil.delta_compression(default_comp, deltainfo)
                         compression_mode, deltainfo = r
                     sidedata_compression_mode = COMP_MODE_INLINE
                     if sidedata and self.feature_config.has_side_data:
                         sidedata_compression_mode = COMP_MODE_PLAIN
                         serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
                         sidedata_offset = self._docket.sidedata_end
                         h, comp_sidedata = self._inner.compress(serialized_sidedata)
                         # only keep the compressed form when it is actually smaller
                         # and neither stored uncompressed (b'u' header) nor starting
                         # with a NUL byte
                         if (
                             h != b'u'
                             and comp_sidedata[0:1] != b'\0'
                             and len(comp_sidedata) < len(serialized_sidedata)
                         ):
                             assert not h
                             if (
                                 comp_sidedata[0:1]
                                 == self._docket.default_compression_header
                             ):
                                 sidedata_compression_mode = COMP_MODE_DEFAULT
                                 serialized_sidedata = comp_sidedata
                             else:
                                 sidedata_compression_mode = COMP_MODE_INLINE
                                 serialized_sidedata = comp_sidedata
                     else:
                         serialized_sidedata = b""
                         # Don't store the offset if the sidedata is empty, that way
                         # we can easily detect empty sidedata and they will be no different
                         # than ones we manually add.
                         sidedata_offset = 0
                     # the rank stays RANK_UNKNOWN unless rank computation is enabled
                     rank = RANK_UNKNOWN
                     if self.feature_config.compute_rank:
                         if (p1r, p2r) == (nullrev, nullrev):
                             rank = 1
                         elif p1r != nullrev and p2r == nullrev:
                             rank = 1 + self.fast_rank(p1r)
                         elif p1r == nullrev and p2r != nullrev:
                             rank = 1 + self.fast_rank(p2r)
                         else:  # merge node
                             if rustdagop is not None and self.index.rust_ext_compat:
                                 rank = rustdagop.rank(self.index, p1r, p2r)
                             else:
                                 pmin, pmax = sorted((p1r, p2r))
                                 rank = 1 + self.fast_rank(pmax)
                                 rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))
                     e = revlogutils.entry(
                         flags=flags,
                         data_offset=offset,
                         data_compressed_length=deltainfo.deltalen,
                         data_uncompressed_length=textlen,
                         data_compression_mode=compression_mode,
                         data_delta_base=deltainfo.base,
                         link_rev=link,
                         parent_rev_1=p1r,
                         parent_rev_2=p2r,
                         node_id=node,
                         sidedata_offset=sidedata_offset,
                         sidedata_compressed_length=len(serialized_sidedata),
                         sidedata_compression_mode=sidedata_compression_mode,
                         rank=rank,
                     )
                     self.index.append(e)
                     entry = self.index.entry_binary(curr)
                     if curr == 0 and self._docket is None:
                         # the very first entry of a docket-less revlog is prefixed
                         # with the packed format header
                         header = self._format_flags | self._format_version
                         header = self.index.pack_header(header)
                         entry = header + entry
                     self._writeentry(
                         transaction,
                         entry,
                         deltainfo.data,
                         link,
                         offset,
                         serialized_sidedata,
                         sidedata_offset,
                     )
                     rawtext = btext[0]
                     if alwayscache and rawtext is None:
                         rawtext = deltacomputer.buildtext(revinfo)
                     if type(rawtext) == bytes:  # only accept immutable objects
                         self._inner._revisioncache = (node, curr, rawtext)
                     # remember the chain base of the new revision
                     self._chainbasecache[curr] = deltainfo.chainbase
                     return curr
                 def _get_data_offset(self, prev):
                     """Returns the current offset in the (in-transaction) data file.
                     Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket
                     file to store that information: since sidedata can be rewritten to the
                     end of the data file within a transaction, you can have cases where, for
                     example, rev `n` does not have sidedata while rev `n - 1` does, leading
                     to `n - 1`'s sidedata being written after `n`'s data.
                     TODO cache this in a docket file before getting out of experimental."""
                     if self._docket is None:
                         return self.end(prev)
                     else:
                         return self._docket.data_end
                 def _writeentry(
                     self,
                     transaction,
                     entry,
                     data,
                     link,
                     offset,
                     sidedata,
                     sidedata_offset,
                 ):
                     """Write one index entry together with its data and sidedata.

                     The write itself is delegated to ``self._inner.write_entry``.  When
                     a docket is in use, the end offsets it records are handed to the
                     writer and then refreshed from the offsets the writer returns;
                     without a docket ``None`` is passed for all three offsets.  After
                     the write, the inline size limit is enforced and the persistent
                     nodemap is set up for ``transaction``.
                     """
                     # Background on why write positions are tracked explicitly: files
                     # opened in a+ mode have inconsistent behavior on various
                     # platforms. Windows requires that a file positioning call be made
                     # when the file handle transitions between reads and writes. See
                     # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
                     # platforms, Python or the platform itself can be buggy. Some
                     # versions of Solaris have been observed to not append at the end
                     # of the file if the file was seeked to before the end. See
                     # issue4943 for more.
                     #
                     # The workaround is a seek() before writing.  This is likely not
                     # necessary on Python 3, but the file handle is reused for reads
                     # and may be seeked there, so be careful before changing this.
                     docket = self._docket
                     if docket is None:
                         known_ends = (None, None, None)
                     else:
                         known_ends = (
                             docket.index_end,
                             docket.data_end,
                             docket.sidedata_end,
                         )
                     new_ends = self._inner.write_entry(
                         transaction,
                         entry,
                         data,
                         link,
                         offset,
                         sidedata,
                         sidedata_offset,
                         *known_ends,
                     )
                     self._enforceinlinesize(transaction)
                     docket = self._docket
                     if docket is not None:
                         docket.index_end = new_ends[0]
                         docket.data_end = new_ends[1]
                         docket.sidedata_end = new_ends[2]
                     nodemaputil.setup_persistent_nodemap(transaction, self)
                 def addgroup(
                     self,
                     deltas,
                     linkmapper,
                     transaction,
                     alwayscache=False,
                     addrevisioncb=None,
                     duplicaterevisioncb=None,
                     debug_info=None,
                     delta_base_reuse_policy=None,
                 ):
                     """
                     add a delta group

                     given a set of deltas, add them to the revision log. the
                     first delta is against its parent, which should be in our
                     log, the rest are against the previous delta.

                     Each item of ``deltas`` is unpacked as the 8-tuple
                     ``(node, p1, p2, linknode, deltabase, delta, flags, sidedata)``;
                     ``linkmapper(linknode)`` provides the link revision.

                     If ``addrevisioncb`` is defined, it will be called with arguments of
                     this revlog and the revision number that was added.
                     ``duplicaterevisioncb``, if defined, is called the same way for a
                     node that is already present in the index.

                     When ``delta_base_reuse_policy`` is None it is derived from the
                     revlog delta config: ``DELTA_BASE_REUSE_TRY`` when both
                     ``general_delta`` and ``lazy_delta_base`` are set, otherwise
                     ``DELTA_BASE_REUSE_NO``.

                     Returns True if at least one item of ``deltas`` was processed
                     (added or found to be a duplicate), False otherwise.

                     Raises ``error.ProgrammingError`` on nested calls,
                     ``error.LookupError`` for an unknown parent or delta base, and
                     ``error.CensoredBaseError`` when a delta against a censored base is
                     not a full replacement.
                     """
                     if self._adding_group:
                         raise error.ProgrammingError(b'cannot nest addgroup() calls')
                     # read the default delta-base reuse policy from revlog config if the
                     # group did not specify one.
                     if delta_base_reuse_policy is None:
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse_policy = DELTA_BASE_REUSE_NO
                     # guard flag against re-entrancy; always reset in the ``finally``
                     self._adding_group = True
                     # stays True until at least one delta has been seen
                     empty = True
                     try:
                         with self._writing(transaction):
                             write_debug = None
                             if self.delta_config.debug_delta:
                                 write_debug = transaction._report
                             # a single delta computer is shared by the whole group
                             deltacomputer = deltautil.deltacomputer(
                                 self,
                                 write_debug=write_debug,
                                 debug_info=debug_info,
                             )
                             # loop through our set of deltas
                             for data in deltas:
                                 (
                                     node,
                                     p1,
                                     p2,
                                     linknode,
                                     deltabase,
                                     delta,
                                     flags,
                                     sidedata,
                                 ) = data
                                 link = linkmapper(linknode)
                                 flags = flags or REVIDX_DEFAULT_FLAGS
                                 rev = self.index.get_rev(node)
                                 if rev is not None:
                                     # this can happen if two branches make the same change
                                     self._nodeduplicatecallback(transaction, rev)
                                     if duplicaterevisioncb:
                                         duplicaterevisioncb(self, rev)
                                     empty = False
                                     continue
                                 # both parents must already be stored in this revlog
                                 for p in (p1, p2):
                                     if not self.index.has_node(p):
                                         raise error.LookupError(
                                             p, self.radix, _(b'unknown parent')
                                         )
                                 # ... and so must the revision the delta applies to
                                 if not self.index.has_node(deltabase):
                                     raise error.LookupError(
                                         deltabase, self.display_id, _(b'unknown delta base')
                                     )
                                 baserev = self.rev(deltabase)
                                 if baserev != nullrev and self.iscensored(baserev):
                                     # if base is censored, delta must be full replacement in a
                                     # single patch operation
                                     hlen = struct.calcsize(b">lll")
                                     oldlen = self.rawsize(baserev)
                                     newlen = len(delta) - hlen
                                     if delta[:hlen] != mdiff.replacediffheader(
                                         oldlen, newlen
                                     ):
                                         raise error.CensoredBaseError(
                                             self.display_id, self.node(baserev)
                                         )
                                 # only probe the delta for censorship when no flag is set
                                 if not flags and self._peek_iscensored(baserev, delta):
                                     flags |= REVIDX_ISCENSORED
                                 # We assume consumers of addrevisioncb will want to retrieve
                                 # the added revision, which will require a call to
                                 # revision(). revision() will fast path if there is a cache
                                 # hit. So, we tell _addrevision() to always cache in this case.
                                 # We're only using addgroup() in the context of changegroup
                                 # generation so the revision data can always be handled as raw
                                 # by the flagprocessor.
                                 rev = self._addrevision(
                                     node,
                                     None,
                                     transaction,
                                     link,
                                     p1,
                                     p2,
                                     flags,
                                     (baserev, delta, delta_base_reuse_policy),
                                     alwayscache=alwayscache,
                                     deltacomputer=deltacomputer,
                                     sidedata=sidedata,
                                 )
                                 if addrevisioncb:
                                     addrevisioncb(self, rev)
                                 empty = False
                     finally:
                         self._adding_group = False
                     return not empty
                 def iscensored(self, rev):
                     """Check if a file revision is censored.

                     Always False when the revlog's feature config is not censorable;
                     otherwise the revision flags masked with ``REVIDX_ISCENSORED``
                     (zero when the flag is not set).
                     """
                     if self.feature_config.censorable:
                         return self.flags(rev) & REVIDX_ISCENSORED
                     return False
                 def _peek_iscensored(self, baserev, delta):
                     """Quickly check if a delta produces a censored revision."""
                     if not self.feature_config.censorable:
                         return False
                     return storageutil.deltaiscensored(delta, baserev, self.rawsize)
                 def getstrippoint(self, minlink):
                     """Find the minimum rev that must be stripped to strip ``minlink``.

                     Returns a tuple containing the minimum rev and a set of all revs
                     that have linkrevs that will be broken by this strip.
                     """
                     tiprev = len(self) - 1
                     heads = self.headrevs()
                     return storageutil.resolvestripinfo(
                         minlink, tiprev, heads, self.linkrev, self.parentrevs
                     )
                 def strip(self, minlink, transaction):
                     """truncate the revlog on the first revision with a linkrev >= minlink

                     This function is called when we're stripping revision minlink and
                     its descendants from the repository.

                     We have to remove all revisions with linkrev >= minlink, because
                     the equivalent changelog revisions will be renumbered after the
                     strip.

                     So we truncate the revlog on the first of these revisions, and
                     trust that the caller has saved the revisions that shouldn't be
                     removed and that it'll re-add them after this truncation.

                     Nothing is done when the revlog is empty or when the strip point
                     equals ``len(self)``.
                     """
                     if len(self) == 0:
                         return
                     # ``_`` is a throwaway local here; it shadows the module-level i18n
                     # ``_`` for the remainder of this method.
                     rev, _ = self.getstrippoint(minlink)
                     if rev == len(self):
                         return
                     # first truncate the files on disk
                     data_end = self.start(rev)
                     if not self._inline:
                         transaction.add(self._datafile, data_end)
                         end = rev * self.index.entry_size
                     else:
                         # inline: index entries and data share one file, so the cut
                         # point is the data offset plus ``rev`` index entries
                         end = data_end + (rev * self.index.entry_size)
                     if self._sidedatafile:
                         sidedata_end = self.sidedata_cut_off(rev)
                         transaction.add(self._sidedatafile, sidedata_end)
                     transaction.add(self._indexfile, end)
                     if self._docket is not None:
                         # XXX we could leverage the docket while stripping. However it is
                         # not powerful enough at the time of this comment
                         # NOTE(review): ``sidedata_end`` is only bound when
                         # ``self._sidedatafile`` is truthy; presumably a docket always
                         # comes with a sidedata file -- confirm.
                         self._docket.index_end = end
                         self._docket.data_end = data_end
                         self._docket.sidedata_end = sidedata_end
                         self._docket.write(transaction, stripping=True)
                     # then reset internal state in memory to forget those revisions
                     self._chaininfocache = util.lrucachedict(500)
                     self._inner.clear_cache()
                     # presumably the index treats a ``-1`` stop as "through the last
                     # entry" -- verify against the index implementation
                     del self.index[rev:-1]
                 def checksize(self):
                     """Check size of index and data files

                     return a (dd, di) tuple.
                     - dd: extra bytes for the "data" file
                     - di: extra bytes for the "index" file

                     A healthy revlog will return (0, 0).

                     A file that does not exist contributes 0.  For an inline revlog
                     ``dd`` is always 0 and ``di`` is the index file size minus the
                     index entries and the summed revision lengths.
                     """
                     expected = 0
                     if len(self):
                         expected = max(0, self.end(len(self) - 1))

                     try:
                         with self._datafp() as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         dd = actual - expected
                     except FileNotFoundError:
                         dd = 0

                     try:
                         # A context manager guarantees the index handle is closed even
                         # if seek()/tell() raise.
                         with self.opener(self._indexfile) as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         s = self.index.entry_size
                         # bytes left over after the last whole index entry
                         whole_entries = max(0, actual // s)
                         di = actual - (whole_entries * s)
                         if self._inline:
                             # index and data are interleaved in a single file
                             databytes = sum(max(0, self.length(r)) for r in self)
                             dd = 0
                             di = actual - len(self) * s - databytes
                     except FileNotFoundError:
                         di = 0
                     return (dd, di)
                 def files(self):
                     """Return the list of files that compose this revlog.

                     The index file always comes first.  Without a docket file, the data
                     file follows unless the revlog is inline.  With a docket file, the
                     docket is listed, then for index, data and sidedata in turn: the
                     current file (data and sidedata only when their recorded end is
                     non-zero) and the non-empty old files known to the docket.
                     """
                     paths = [self._indexfile]
                     if self._docket_file is None:
                         if not self._inline:
                             paths.append(self._datafile)
                         return paths

                     paths.append(self._docket_file)
                     paths += self._docket.old_index_filepaths(include_empty=False)
                     if self._docket.data_end:
                         paths.append(self._datafile)
                     paths += self._docket.old_data_filepaths(include_empty=False)
                     if self._docket.sidedata_end:
                         paths.append(self._sidedatafile)
                     paths += self._docket.old_sidedata_filepaths(include_empty=False)
                     return paths
                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                     sidedata_helpers=None,
                     debug_info=None,
                 ):
                     """Emit revisions for ``nodes`` via ``storageutil.emitrevisions``.

                     ``nodesorder`` must be one of ``b'nodes'``, ``b'storage'``,
                     ``b'linear'`` or None, otherwise ``error.ProgrammingError`` is
                     raised.  None becomes ``b'storage'`` when the revlog does not use
                     general delta.  When the revlog does not store delta chains, any
                     ``deltamode`` other than ``CG_DELTAMODE_PREV`` is replaced by
                     ``CG_DELTAMODE_FULL``.
                     """
                     accepted_orders = (b'nodes', b'storage', b'linear', None)
                     if nodesorder not in accepted_orders:
                         raise error.ProgrammingError(
                             b'unhandled value for nodesorder: %s' % nodesorder
                         )

                     if nodesorder is None:
                         if not self.delta_config.general_delta:
                             nodesorder = b'storage'

                     if not (
                         self._storedeltachains
                         or deltamode == repository.CG_DELTAMODE_PREV
                     ):
                         deltamode = repository.CG_DELTAMODE_FULL

                     # callbacks through which storageutil queries this revlog
                     revlog_callbacks = dict(
                         deltaparentfn=self.deltaparent,
                         candeltafn=self._candelta,
                         rawsizefn=self.rawsize,
                         revdifffn=self.revdiff,
                         flagsfn=self.flags,
                     )
                     return storageutil.emitrevisions(
                         self,
                         nodes,
                         nodesorder,
                         revlogrevisiondelta,
                         deltamode=deltamode,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         sidedata_helpers=sidedata_helpers,
                         debug_info=debug_info,
                         **revlog_callbacks,
                     )
                 # Accepted values for the ``deltareuse`` argument of ``clone()``.
                 DELTAREUSEALWAYS = b'always'
                 DELTAREUSESAMEREVS = b'samerevs'
                 DELTAREUSENEVER = b'never'
                 DELTAREUSEFULLADD = b'fulladd'
                 # Set of every accepted policy; ``clone()`` rejects anything else.
                 DELTAREUSEALL = {
                     DELTAREUSEALWAYS,
                     DELTAREUSESAMEREVS,
                     DELTAREUSENEVER,
                     DELTAREUSEFULLADD,
                 }
                 def clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb=None,
                     deltareuse=DELTAREUSESAMEREVS,
                     forcedeltabothparents=None,
                     sidedata_helpers=None,
                 ):
                     """Copy this revlog to another, possibly with format changes.

                     The destination revlog will contain the same revisions and nodes.
                     However, it may not be bit-for-bit identical due to e.g. delta
                     encoding differences.

                     ``deltareuse`` selects how deltas stored in this revlog are carried
                     over to the destination:

                     DELTAREUSEALWAYS
                        Reuse deltas whenever possible, even if the destination revlog
                        would not select the same revisions for the delta. This is the
                        fastest mode of operation.
                     DELTAREUSESAMEREVS
                        Reuse a delta if the destination revlog would pick the same
                        revisions for it. This mode strikes a balance between speed and
                        optimization, and is the default: deltas are reused when
                        appropriate, but a better base is used if one exists. When
                        converting a non-generaldelta revlog to a generaldelta one,
                        deltas are therefore recomputed if the delta's parent isn't a
                        parent of the revision.
                     DELTAREUSENEVER
                        Never reuse deltas. This is the slowest mode of execution and
                        can be used to recompute deltas (e.g. if the diff/delta
                        algorithm changes).
                     DELTAREUSEFULLADD
                        Re-add revisions as if they were new content. This is slower
                        than DELTAREUSEALWAYS but lets more mechanisms kick in, e.g.
                        large file detection and handling.

                     Delta computation can be slow, so the choice of delta reuse policy
                     can significantly affect run time.

                     ``forcedeltabothparents`` controls whether to force computing deltas
                     against both parents for merges; when falsy, the destination's
                     current setting is used.

                     See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
                     `sidedata_helpers`.

                     Raises ``ValueError`` for an invalid ``deltareuse``, a non-empty
                     destination, or filtered revisions on either side.
                     """
                     if deltareuse not in self.DELTAREUSEALL:
                         raise ValueError(
                             _(b'value for deltareuse invalid: %s') % deltareuse
                         )
                     if len(destrevlog):
                         raise ValueError(_(b'destination revlog is not empty'))
                     if getattr(self, 'filteredrevs', None):
                         raise ValueError(_(b'source revlog has filtered revisions'))
                     if getattr(destrevlog, 'filteredrevs', None):
                         raise ValueError(_(b'destination revlog has filtered revisions'))

                     # lazy_delta and lazy_delta_base control whether to reuse a cached
                     # delta, if possible.  Work on a copy of the destination's config
                     # and restore the original once cloning is over.
                     saved_config = destrevlog.delta_config
                     destrevlog.delta_config = saved_config.copy()
                     try:
                         working = destrevlog.delta_config
                         # (policy, lazy_delta_base, lazy_delta); DELTAREUSEFULLADD
                         # leaves both settings untouched
                         lazy_by_policy = (
                             (self.DELTAREUSEALWAYS, True, True),
                             (self.DELTAREUSESAMEREVS, False, True),
                             (self.DELTAREUSENEVER, False, False),
                         )
                         for policy, lazy_base, lazy in lazy_by_policy:
                             if deltareuse == policy:
                                 working.lazy_delta_base = lazy_base
                                 working.lazy_delta = lazy
                                 break

                         working.delta_both_parents = (
                             forcedeltabothparents or saved_config.delta_both_parents
                         )

                         with self.reading(), destrevlog._writing(tr):
                             self._clone(
                                 tr,
                                 destrevlog,
                                 addrevisioncb,
                                 deltareuse,
                                 forcedeltabothparents,
                                 sidedata_helpers,
                             )
                     finally:
                         destrevlog.delta_config = saved_config
                 def _clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb,
                     deltareuse,
                     forcedeltabothparents,
                     sidedata_helpers,
                 ):
                     """perform the core duty of `revlog.clone` after parameter processing

                     Every revision of this revlog is read and added to ``destrevlog``
                     within transaction ``tr``.  With ``DELTAREUSEFULLADD`` the revision
                     goes through ``destrevlog.addrevision``; otherwise it goes through
                     ``destrevlog._addrevision``, passing the stored delta as a cached
                     delta when the destination's ``lazy_delta`` is set and the revision
                     has a delta parent.

                     When ``sidedata_helpers`` is given, the helpers are run on each
                     revision's sidedata and the ``(flags_to_add, flags_to_remove)``
                     pair they return is applied to the revision flags.

                     ``addrevisioncb``, if set, is called with ``(self, rev, node)``
                     after each revision.  ``forcedeltabothparents`` is accepted for
                     signature compatibility and is not used here.
                     """
                     write_debug = None
                     if self.delta_config.debug_delta:
                         write_debug = tr._report
                     deltacomputer = deltautil.deltacomputer(
                         destrevlog,
                         write_debug=write_debug,
                     )
                     index = self.index
                     for rev in self:
                         entry = index[rev]

                         # Some classes override linkrev to take filtered revs into
                         # account. Use raw entry from index.
                         flags = entry[0] & 0xFFFF
                         linkrev = entry[4]
                         p1 = index[entry[5]][7]
                         p2 = index[entry[6]][7]
                         node = entry[7]

                         # (Possibly) reuse the delta from the revlog if allowed and
                         # the revlog chunk is a delta.
                         cachedelta = None
                         rawtext = None
                         if deltareuse == self.DELTAREUSEFULLADD:
                             text = self._revisiondata(rev)
                             sidedata = self.sidedata(rev)

                             if sidedata_helpers is not None:
                                 (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # Add first, then clear.  Without the parentheses
                                 # ``&`` binds tighter than ``|`` and the removal mask
                                 # would never clear a flag already set on the
                                 # revision.
                                 flags = (flags | new_flags[0]) & ~new_flags[1]

                             destrevlog.addrevision(
                                 text,
                                 tr,
                                 linkrev,
                                 p1,
                                 p2,
                                 cachedelta=cachedelta,
                                 node=node,
                                 flags=flags,
                                 deltacomputer=deltacomputer,
                                 sidedata=sidedata,
                             )
                         else:
                             if destrevlog.delta_config.lazy_delta:
                                 dp = self.deltaparent(rev)
                                 if dp != nullrev:
                                     cachedelta = (dp, bytes(self._inner._chunk(rev)))

                             sidedata = None
                             if not cachedelta:
                                 # no reusable delta: fall back to the full raw text
                                 try:
                                     rawtext = self._revisiondata(rev)
                                 except error.CensoredNodeError as censored:
                                     assert flags & REVIDX_ISCENSORED
                                     rawtext = censored.tombstone
                                 sidedata = self.sidedata(rev)
                             if sidedata is None:
                                 sidedata = self.sidedata(rev)

                             if sidedata_helpers is not None:
                                 (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # same add-then-clear order as in the full-add branch
                                 flags = (flags | new_flags[0]) & ~new_flags[1]

                             destrevlog._addrevision(
                                 node,
                                 rawtext,
                                 tr,
                                 linkrev,
                                 p1,
                                 p2,
                                 flags,
                                 cachedelta,
                                 deltacomputer=deltacomputer,
                                 sidedata=sidedata,
                             )

                         if addrevisioncb:
                             addrevisioncb(self, rev, node)
                 def censorrevision(self, tr, censor_nodes, tombstone=b''):
                     """Censor ``censor_nodes`` using the rewriter matching the format.

                     Version 0 revlogs cannot be censored and raise
                     ``error.RevlogError``.  Version 1 revlogs are handled by
                     ``rewrite.v1_censor``, every other version by
                     ``rewrite.v2_censor``.
                     """
                     version = self._format_version
                     if version == REVLOGV0:
                         raise error.RevlogError(
                             _(b'cannot censor with version %d revlogs') % version
                         )
                     if version == REVLOGV1:
                         censor = rewrite.v1_censor
                     else:
                         censor = rewrite.v2_censor
                     censor(self, tr, censor_nodes, tombstone)
                 def verifyintegrity(self, state):
                     """Verifies the integrity of the revlog.
                     Yields ``revlogproblem`` instances describing problems that are
                     found.
                     """
                     dd, di = self.checksize()
                     if dd:
                         yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
                     if di:
                         yield revlogproblem(error=_(b'index contains %d extra bytes') % di)
                     version = self._format_version
                     # The verifier tells us what version revlog we should be.
                     if version != state[b'expectedversion']:
                         yield revlogproblem(
                             warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                             % (self.display_id, version, state[b'expectedversion'])
                         )
                     state[b'skipread'] = set()
                     state[b'safe_renamed'] = set()
                     for rev in self:
                         node = self.node(rev)
                         # Verify contents. 4 cases to care about:
                         #
                         #   common: the most common case
                         #   rename: with a rename
                         #   meta: file content starts with b'\1\n', the metadata
                         #         header defined in filelog.py, but without a rename
                         #   ext: content stored externally
                         #
                         # More formally, their differences are shown below:
                         #
                         #                       | common | rename | meta  | ext
                         #  -------------------------------------------------------
                         #   flags()             | 0      | 0      | 0     | not 0
                         #   renamed()           | False  | True   | False | ?
                         #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
                         #
                         # "rawtext" means the raw text stored in revlog data, which
                         # could be retrieved by "rawdata(rev)". "text"
                         # mentioned below is "revision(rev)".
                         #
                         # There are 3 different lengths stored physically:
                         #  1. L1: rawsize, stored in revlog index
                         #  2. L2: len(rawtext), stored in revlog data
                         #  3. L3: len(text), stored in revlog data if flags==0, or
                         #     possibly somewhere else if flags!=0
                         #
                         # L1 should be equal to L2. L3 could be different from them.
                         # "text" may or may not affect commit hash depending on flag
                         # processors (see flagutil.addflagprocessor).
                         #
                         #              | common  | rename | meta  | ext
                         # -------------------------------------------------
                         #    rawsize() | L1      | L1     | L1    | L1
                         #       size() | L1      | L2-LM  | L1(*) | L1 (?)
                         # len(rawtext) | L2      | L2     | L2    | L2
                         #    len(text) | L2      | L2     | L2    | L3
                         #  len(read()) | L2      | L2-LM  | L2-LM | L3 (?)
                         #
                         # LM:  length of metadata, depending on rawtext
                         # (*): not ideal, see comment in filelog.size
                         # (?): could be "- len(meta)" if the resolved content has
                         #      rename metadata
                         #
                         # Checks needed to be done:
                         #  1. length check: L1 == L2, in all cases.
                         #  2. hash check: depending on flag processor, we may need to
                         #     use either "text" (external), or "rawtext" (in revlog).
                         try:
                             skipflags = state.get(b'skipflags', 0)
                             if skipflags:
                                 skipflags &= self.flags(rev)
                             _verify_revision(self, skipflags, state, node)
                             l1 = self.rawsize(rev)
                             l2 = len(self.rawdata(node))
                             if l1 != l2:
                                 yield revlogproblem(
                                     error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                                     node=node,
                                 )
                         except error.CensoredNodeError:
                             if state[b'erroroncensored']:
                                 yield revlogproblem(
                                     error=_(b'censored file data'), node=node
                                 )
                                 state[b'skipread'].add(node)
                         except Exception as e:
                             yield revlogproblem(
                                 error=_(b'unpacking %s: %s')
                                 % (short(node), stringutil.forcebytestr(e)),
                                 node=node,
                             )
                             state[b'skipread'].add(node)
                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     """Collect the requested storage facts about this revlog.

                     Each boolean argument enables one bytes key in the returned
                     dict; keys whose argument is false are simply absent:

                     - ``exclusivefiles``: list of ``(opener, path)`` pairs, the index
                       file plus the data file when the revlog is not inline.
                     - ``sharedfiles``: always an empty list.
                     - ``revisionscount``: ``len(self)``.
                     - ``trackedsize``: sum of ``rawsize(rev)`` over all revisions.
                     - ``storedsize``: sum of the ``st_size`` reported by the opener
                       for every path returned by ``self.files()``.
                     """
                     info = {}
                     if exclusivefiles:
                         owned = [(self.opener, self._indexfile)]
                         if not self._inline:
                             # Non-inline revlogs keep revision data in a separate file.
                             owned.append((self.opener, self._datafile))
                         info[b'exclusivefiles'] = owned
                     if sharedfiles:
                         info[b'sharedfiles'] = []
                     if revisionscount:
                         info[b'revisionscount'] = len(self)
                     if trackedsize:
                         info[b'trackedsize'] = sum(self.rawsize(rev) for rev in self)
                     if storedsize:
                         on_disk = 0
                         for path in self.files():
                             on_disk += self.opener.stat(path).st_size
                         info[b'storedsize'] = on_disk
                     return info
                 def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
                     """Generate and store sidedata for revisions startrev..endrev.

                     Both bounds are inclusive. For each revision the sidedata helpers
                     are run, the result is serialized (and kept compressed when that
                     is strictly smaller), written to the sidedata file, and the
                     matching index entries are then rewritten in place.

                     This is a no-op when the revlog format has no sidedata support or
                     when ``helpers[1]`` and ``helpers[2]`` are both empty (nothing to
                     generate or remove).

                     Raises ``error.Abort`` when a revision in the range already has
                     sidedata recorded in its index entry.
                     """
                     if not self.feature_config.has_side_data:
                         return
                     # revlog formats with sidedata support does not support inline
                     assert not self._inline
                     if not helpers[1] and not helpers[2]:
                         # Nothing to generate or remove
                         return
                     new_entries = []
                     # append the new sidedata
                     with self._writing(transaction):
                         ifh, _dfh, sdfh = self._inner._writinghandles
                         # Position the *sidedata* handle (not the data handle) at the
                         # end recorded in the docket: `current_offset` below is read
                         # from `sdfh` and is where the new sidedata gets written.
                         sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                         current_offset = sdfh.tell()
                         for rev in range(startrev, endrev + 1):
                             entry = self.index[rev]
                             new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                                 store=self,
                                 sidedata_helpers=helpers,
                                 sidedata={},
                                 rev=rev,
                             )
                             serialized_sidedata = sidedatautil.serialize_sidedata(
                                 new_sidedata
                             )
                             sidedata_compression_mode = COMP_MODE_INLINE
                             if serialized_sidedata and self.feature_config.has_side_data:
                                 sidedata_compression_mode = COMP_MODE_PLAIN
                                 h, comp_sidedata = self._inner.compress(serialized_sidedata)
                                 # Slice instead of indexing: on Python 3 indexing a
                                 # bytes object yields an int, which never compares
                                 # equal to a bytes value such as b'\0'.
                                 comp_header = comp_sidedata[0:1]
                                 if (
                                     h != b'u'
                                     and comp_header != b'\0'
                                     and len(comp_sidedata) < len(serialized_sidedata)
                                 ):
                                     assert not h
                                     if comp_header == self._docket.default_compression_header:
                                         sidedata_compression_mode = COMP_MODE_DEFAULT
                                     else:
                                         sidedata_compression_mode = COMP_MODE_INLINE
                                     # Either way the compressed form is what gets stored.
                                     serialized_sidedata = comp_sidedata
                             if entry[8] != 0 or entry[9] != 0:
                                 # rewriting entries that already have sidedata is not
                                 # supported yet, because it introduces garbage data in the
                                 # revlog.
                                 msg = b"rewriting existing sidedata is not supported yet"
                                 raise error.Abort(msg)
                             # Apply (potential) flags to add and to remove after running
                             # the sidedata helpers
                             # NOTE(review): `&` binds tighter than `|`, so the removal
                             # mask only filters the flags being added and never clears
                             # bits already set in entry[0]. Parentheses make the
                             # existing behavior explicit -- confirm this is intended.
                             new_offset_flags = entry[0] | (flags[0] & ~flags[1])
                             entry_update = (
                                 current_offset,
                                 len(serialized_sidedata),
                                 new_offset_flags,
                                 sidedata_compression_mode,
                             )
                             # the sidedata computation might have moved the file cursors
                             # around
                             sdfh.seek(current_offset, os.SEEK_SET)
                             sdfh.write(serialized_sidedata)
                             new_entries.append(entry_update)
                             current_offset += len(serialized_sidedata)
                             self._docket.sidedata_end = sdfh.tell()
                         # rewrite the new index entries
                         ifh.seek(startrev * self.index.entry_size)
                         for rev, e in enumerate(new_entries, startrev):
                             self.index.replace_sidedata_info(rev, *e)
                             packed = self.index.entry_binary(rev)
                             if rev == 0 and self._docket is None:
                                 # Without a docket, the first index entry is written
                                 # with the packed format header prepended.
                                 header = self._format_flags | self._format_version
                                 header = self.index.pack_header(header)
                                 packed = header + packed
                             ifh.write(packed)