revlog: add a `canonical_index_file` attribute on inner revlog...
marmoute
r51998:af96fbb8 default
@@ -1,4049 +1,4053 @@
# revlog.py - storage back-end for mercurial
# coding: utf8
#
# Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""


import binascii
import collections
import contextlib
import io
import os
import struct
import weakref
import zlib

# import stuff from node for others to import from revlog
from .node import (
    bin,
    hex,
    nullrev,
    sha1nodeconstants,
    short,
    wdirrev,
)
from .i18n import _
from .revlogutils.constants import (
    ALL_KINDS,
    CHANGELOGV2,
    COMP_MODE_DEFAULT,
    COMP_MODE_INLINE,
    COMP_MODE_PLAIN,
    DELTA_BASE_REUSE_NO,
    DELTA_BASE_REUSE_TRY,
    ENTRY_RANK,
    FEATURES_BY_VERSION,
    FLAG_GENERALDELTA,
    FLAG_INLINE_DATA,
    INDEX_HEADER,
    KIND_CHANGELOG,
    KIND_FILELOG,
    RANK_UNKNOWN,
    REVLOGV0,
    REVLOGV1,
    REVLOGV1_FLAGS,
    REVLOGV2,
    REVLOGV2_FLAGS,
    REVLOG_DEFAULT_FLAGS,
    REVLOG_DEFAULT_FORMAT,
    REVLOG_DEFAULT_VERSION,
    SUPPORTED_FLAGS,
)
from .revlogutils.flagutil import (
    REVIDX_DEFAULT_FLAGS,
    REVIDX_ELLIPSIS,
    REVIDX_EXTSTORED,
    REVIDX_FLAGS_ORDER,
    REVIDX_HASCOPIESINFO,
    REVIDX_ISCENSORED,
    REVIDX_RAWTEXT_CHANGING_FLAGS,
)
from .thirdparty import attr
from . import (
    ancestor,
    dagop,
    error,
    mdiff,
    policy,
    pycompat,
    revlogutils,
    templatefilters,
    util,
)
from .interfaces import (
    repository,
    util as interfaceutil,
)
from .revlogutils import (
    deltas as deltautil,
    docket as docketutil,
    flagutil,
    nodemap as nodemaputil,
    randomaccessfile,
    revlogv0,
    rewrite,
    sidedata as sidedatautil,
)
from .utils import (
    storageutil,
    stringutil,
)

# blanked usage of all the names to prevent pyflakes complaints
# We need these names available in the module for extensions.

REVLOGV0
REVLOGV1
REVLOGV2
CHANGELOGV2
FLAG_INLINE_DATA
FLAG_GENERALDELTA
REVLOG_DEFAULT_FLAGS
REVLOG_DEFAULT_FORMAT
REVLOG_DEFAULT_VERSION
REVLOGV1_FLAGS
REVLOGV2_FLAGS
REVIDX_ISCENSORED
REVIDX_ELLIPSIS
REVIDX_HASCOPIESINFO
REVIDX_EXTSTORED
REVIDX_DEFAULT_FLAGS
REVIDX_FLAGS_ORDER
REVIDX_RAWTEXT_CHANGING_FLAGS

parsers = policy.importmod('parsers')
rustancestor = policy.importrust('ancestor')
rustdagop = policy.importrust('dagop')
rustrevlog = policy.importrust('revlog')

# Aliased for performance.
_zlibdecompress = zlib.decompress

# max size of inline data embedded into a revlog
_maxinline = 131072
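# An inline revlog stores index entries and data chunks interleaved in a
# single ".i" file; once the data outgrows this threshold (128 KiB), the
# revlog is expected to be split into separate index and data files (see
# _InnerRevlog.split_inline below).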

# Flag processors for REVIDX_ELLIPSIS.
def ellipsisreadprocessor(rl, text):
    return text, False


def ellipsiswriteprocessor(rl, text):
    return text, False


def ellipsisrawprocessor(rl, text):
    return False


ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)


def _verify_revision(rl, skipflags, state, node):
    """Verify the integrity of the given revlog ``node`` while providing a hook
    point for extensions to influence the operation."""
    if skipflags:
        state[b'skipread'].add(node)
    else:
        # Side-effect: read content and verify hash.
        rl.revision(node)


# True if a fast implementation for persistent-nodemap is available
#
# We also consider we have a "fast" implementation in "pure" python because
# people using pure don't really have performance considerations (and a
# wheelbarrow of other slowness sources)
HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
    parsers, 'BaseIndexObject'
)


@interfaceutil.implementer(repository.irevisiondelta)
@attr.s(slots=True)
class revlogrevisiondelta:
    node = attr.ib()
    p1node = attr.ib()
    p2node = attr.ib()
    basenode = attr.ib()
    flags = attr.ib()
    baserevisionsize = attr.ib()
    revision = attr.ib()
    delta = attr.ib()
    sidedata = attr.ib()
    protocol_flags = attr.ib()
    linknode = attr.ib(default=None)


@interfaceutil.implementer(repository.iverifyproblem)
@attr.s(frozen=True)
class revlogproblem:
    warning = attr.ib(default=None)
    error = attr.ib(default=None)
    node = attr.ib(default=None)


def parse_index_v1(data, inline):
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline)
    return index, cache


def parse_index_v2(data, inline):
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=REVLOGV2)
    return index, cache


def parse_index_cl_v2(data, inline):
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=CHANGELOGV2)
    return index, cache


if hasattr(parsers, 'parse_index_devel_nodemap'):

    def parse_index_v1_nodemap(data, inline):
        index, cache = parsers.parse_index_devel_nodemap(data, inline)
        return index, cache


else:
    parse_index_v1_nodemap = None


def parse_index_v1_mixed(data, inline):
    index, cache = parse_index_v1(data, inline)
    return rustrevlog.MixedIndex(index), cache


# corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
# signed integer)
_maxentrysize = 0x7FFFFFFF

FILE_TOO_SHORT_MSG = _(
    b'cannot read from revlog %s;'
    b' expected %d bytes from offset %d, data size is %d'
)

hexdigits = b'0123456789abcdefABCDEF'


class _Config:
    def copy(self):
        return self.__class__(**self.__dict__)


@attr.s()
class FeatureConfig(_Config):
    """Hold configuration values about the available revlog features"""

    # the default compression engine
    compression_engine = attr.ib(default=b'zlib')
    # compression engines options
    compression_engine_options = attr.ib(default=attr.Factory(dict))

    # can we use censor on this revlog
    censorable = attr.ib(default=False)
    # does this revlog use the "side data" feature
    has_side_data = attr.ib(default=False)
    # might remove rank configuration once the computation has no impact
    compute_rank = attr.ib(default=False)
    # parent order is supposed to be semantically irrelevant, so we
    # normally resort parents to ensure that the first parent is non-null,
    # if there is a non-null parent at all.
    # filelog abuses the parent order as flag to mark some instances of
    # meta-encoded files, so allow it to disable this behavior.
    canonical_parent_order = attr.ib(default=False)
    # can ellipsis commit be used
    enable_ellipsis = attr.ib(default=False)

    def copy(self):
        new = super().copy()
        new.compression_engine_options = self.compression_engine_options.copy()
        return new


@attr.s()
class DataConfig(_Config):
    """Hold configuration values about how the revlog data are read"""

    # should we try to open the "pending" version of the revlog
    try_pending = attr.ib(default=False)
    # should we try to open the "split" version of the revlog
    try_split = attr.ib(default=False)
    # When True, indexfile should be opened with checkambig=True at writing,
    # to avoid file stat ambiguity.
    check_ambig = attr.ib(default=False)

    # If true, use mmap instead of reading to deal with large index
    mmap_large_index = attr.ib(default=False)
    # how much data is large
    mmap_index_threshold = attr.ib(default=None)
    # How much data to read and cache into the raw revlog data cache.
    chunk_cache_size = attr.ib(default=65536)

    # Allow sparse reading of the revlog data
    with_sparse_read = attr.ib(default=False)
    # minimal density of a sparse read chunk
    sr_density_threshold = attr.ib(default=0.50)
    # minimal size of data we skip when performing sparse read
    sr_min_gap_size = attr.ib(default=262144)

    # are deltas encoded against arbitrary bases.
    generaldelta = attr.ib(default=False)


@attr.s()
class DeltaConfig(_Config):
    """Hold configuration values about how new deltas are computed

    Some attributes are duplicated from DataConfig to help keeping each
    object self-contained.
    """

    # can deltas be encoded against arbitrary bases.
    general_delta = attr.ib(default=False)
    # Allow sparse writing of the revlog data
    sparse_revlog = attr.ib(default=False)
    # maximum length of a delta chain
    max_chain_len = attr.ib(default=None)
    # Maximum distance between delta chain base start and end
    max_deltachain_span = attr.ib(default=-1)
    # If `upper_bound_comp` is not None, this is the expected maximal gain from
    # compression for the data content.
    upper_bound_comp = attr.ib(default=None)
    # Should we try a delta against both parents
    delta_both_parents = attr.ib(default=True)
    # Test delta base candidate groups by chunks of this maximal size.
    candidate_group_chunk_size = attr.ib(default=0)
    # Should we display debug information about delta computation
    debug_delta = attr.ib(default=False)
    # trust incoming deltas by default
    lazy_delta = attr.ib(default=True)
    # trust the base of incoming deltas by default
    lazy_delta_base = attr.ib(default=False)


class _InnerRevlog:
    """An inner layer of the revlog object

    That layer exists to be able to delegate some operations to Rust; its
    boundaries are arbitrary and based on what we can delegate to Rust.
    """

    def __init__(
        self,
        opener,
        index,
        index_file,
        data_file,
        sidedata_file,
        inline,
        data_config,
        delta_config,
        feature_config,
        chunk_cache,
        default_compression_header,
    ):
        self.opener = opener
        self.index = index

        self.__index_file = index_file
        self.data_file = data_file
        self.sidedata_file = sidedata_file
        self.inline = inline
        self.data_config = data_config
        self.delta_config = delta_config
        self.feature_config = feature_config

        self._default_compression_header = default_compression_header

        # index

        # 3-tuple of file handles being used for active writing.
        self._writinghandles = None

        self._segmentfile = randomaccessfile.randomaccessfile(
            self.opener,
            (self.index_file if self.inline else self.data_file),
            self.data_config.chunk_cache_size,
            chunk_cache,
        )
        self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
            self.opener,
            self.sidedata_file,
            self.data_config.chunk_cache_size,
        )

        # revlog header -> revlog compressor
        self._decompressors = {}
        # 3-tuple of (node, rev, text) for a raw revision.
        self._revisioncache = None

    @property
    def index_file(self):
        return self.__index_file

    @index_file.setter
    def index_file(self, new_index_file):
        self.__index_file = new_index_file
        if self.inline:
            self._segmentfile.filename = new_index_file

    def __len__(self):
        return len(self.index)

    def clear_cache(self):
        self._revisioncache = None
        self._segmentfile.clear_cache()
        self._segmentfile_sidedata.clear_cache()

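    # `canonical_index_file` names the index file that outside code should
    # treat as authoritative. In this base implementation it simply mirrors
    # `index_file`; exposing it as a separate attribute presumably gives the
    # write path a hook for cases where writes temporarily target another
    # file (e.g. a transaction-pending index).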
    @property
    def canonical_index_file(self):
        return self.index_file

    # Derived from index values.

    def start(self, rev):
        """the offset of the data chunk for this revision"""
        return int(self.index[rev][0] >> 16)
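    # Index entry field 0 packs two values into one integer: the data offset
    # in the high bits and the 16-bit flag field in the low bits, hence the
    # `>> 16` above.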

    def length(self, rev):
        """the length of the data chunk for this revision"""
        return self.index[rev][1]

    def end(self, rev):
        """the end of the data chunk for this revision"""
        return self.start(rev) + self.length(rev)

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self.delta_config.general_delta:
            return base
        else:
            return rev - 1
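    # Example: in a general-delta revlog, index[7][3] == 5 means rev 7 is
    # stored as a delta against rev 5; base == rev is the conventional marker
    # for a full snapshot, reported as a nullrev delta parent.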

    def issnapshot(self, rev):
        """tells whether rev is a snapshot"""
        if not self.delta_config.sparse_revlog:
            return self.deltaparent(rev) == nullrev
        elif hasattr(self.index, 'issnapshot'):
            # directly assign the method to cache the testing and access
            self.issnapshot = self.index.issnapshot
            return self.issnapshot(rev)
        if rev == nullrev:
            return True
        entry = self.index[rev]
        base = entry[3]
        if base == rev:
            return True
        if base == nullrev:
            return True
        p1 = entry[5]
        while self.length(p1) == 0:
            b = self.deltaparent(p1)
            if b == p1:
                break
            p1 = b
        p2 = entry[6]
        while self.length(p2) == 0:
            b = self.deltaparent(p2)
            if b == p2:
                break
            p2 = b
        if base == p1 or base == p2:
            return False
        return self.issnapshot(base)
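    # In a sparse revlog, a snapshot is a revision stored as a full text or
    # as a delta against something other than its parents, which is why the
    # code above compares the delta base with p1/p2 (skipping empty
    # revisions) and otherwise recurses on the base.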

    def _deltachain(self, rev, stoprev=None):
        """Obtain the delta chain for a revision.

        ``stoprev`` specifies a revision to stop at. If not specified, we
        stop at the base of the chain.

        Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
        revs in ascending order and ``stopped`` is a bool indicating whether
        ``stoprev`` was hit.
        """
        generaldelta = self.delta_config.general_delta
        # Try C implementation.
        try:
            return self.index.deltachain(rev, stoprev, generaldelta)
        except AttributeError:
            pass

        chain = []

        # Alias to prevent attribute lookup in tight loop.
        index = self.index

        iterrev = rev
        e = index[iterrev]
        while iterrev != e[3] and iterrev != stoprev:
            chain.append(iterrev)
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            e = index[iterrev]

        if iterrev == stoprev:
            stopped = True
        else:
            chain.append(iterrev)
            stopped = False

        chain.reverse()
        return chain, stopped
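    # Example: if rev 8 is a delta against rev 5, and rev 5 a delta against
    # the full-text rev 2, then _deltachain(8) returns ([2, 5, 8], False)
    # while _deltachain(8, stoprev=5) returns ([8], True).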

    @util.propertycache
    def _compressor(self):
        engine = util.compengines[self.feature_config.compression_engine]
        return engine.revlogcompressor(
            self.feature_config.compression_engine_options
        )

    @util.propertycache
    def _decompressor(self):
        """the default decompressor"""
        if self._default_compression_header is None:
            return None
        t = self._default_compression_header
        c = self._get_decompressor(t)
        return c.decompress

    def _get_decompressor(self, t):
        try:
            compressor = self._decompressors[t]
        except KeyError:
            try:
                engine = util.compengines.forrevlogheader(t)
                compressor = engine.revlogcompressor(
                    self.feature_config.compression_engine_options
                )
                self._decompressors[t] = compressor
            except KeyError:
                raise error.RevlogError(
                    _(b'unknown compression type %s') % binascii.hexlify(t)
                )
        return compressor

    def compress(self, data):
        """Generate a possibly-compressed representation of data."""
        if not data:
            return b'', data

        compressed = self._compressor.compress(data)

        if compressed:
            # The revlog compressor added the header in the returned data.
            return b'', compressed

        if data[0:1] == b'\0':
            return b'', data
        return b'u', data
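    # The (header, data) pair returned above uses two markers: b'u' flags
    # data stored uncompressed, while an empty header means either that the
    # compressor embedded its own header in `data` or that the data is empty
    # or starts with NUL and can be stored raw unambiguously.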

    def decompress(self, data):
        """Decompress a revlog chunk.

        The chunk is expected to begin with a header identifying the
        format type so it can be routed to an appropriate decompressor.
        """
        if not data:
            return data

        # Revlogs are read much more frequently than they are written and many
        # chunks only take microseconds to decompress, so performance is
        # important here.
        #
        # We can make a few assumptions about revlogs:
        #
        # 1) the majority of chunks will be compressed (as opposed to inline
        #    raw data).
        # 2) decompressing *any* data will likely be at least 10x slower than
        #    returning raw inline data.
        # 3) we want to prioritize common and officially supported compression
        #    engines
        #
        # It follows that we want to optimize for "decompress compressed data
        # when encoded with common and officially supported compression engines"
        # case over "raw data" and "data encoded by less common or non-official
        # compression engines." That is why we have the inline lookup first
        # followed by the compengines lookup.
        #
        # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
        # compressed chunks. And this matters for changelog and manifest reads.
        t = data[0:1]

        if t == b'x':
            try:
                return _zlibdecompress(data)
            except zlib.error as e:
                raise error.RevlogError(
                    _(b'revlog decompress error: %s')
                    % stringutil.forcebytestr(e)
                )
        # '\0' is more common than 'u' so it goes first.
        elif t == b'\0':
            return data
        elif t == b'u':
            return util.buffer(data, 1)

        compressor = self._get_decompressor(t)

        return compressor.decompress(data)

    @contextlib.contextmanager
    def reading(self):
        """Context manager that keeps data and sidedata files open for reading"""
        if len(self.index) == 0:
            yield  # nothing to be read
        else:
            with self._segmentfile.reading():
                with self._segmentfile_sidedata.reading():
                    yield
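    # Callers wrap read-heavy loops in `reading()` so that both segment
    # files keep one open file handle for the whole loop instead of
    # reopening the file for every chunk.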

    @property
    def is_writing(self):
        """True if a writing context is open"""
        return self._writinghandles is not None

    @property
    def is_open(self):
        """True if any file handle is being held

        Used for assert and debug in the python code"""
        return self._segmentfile.is_open or self._segmentfile_sidedata.is_open

    @contextlib.contextmanager
    def writing(self, transaction, data_end=None, sidedata_end=None):
        """Open the revlog files for writing

        Adding content to a revlog should be done within such a context.
        """
        if self.is_writing:
            yield
        else:
            ifh = dfh = sdfh = None
            try:
                r = len(self.index)
                # opening the data file.
                dsize = 0
                if r:
                    dsize = self.end(r - 1)
                dfh = None
                if not self.inline:
                    try:
                        dfh = self.opener(self.data_file, mode=b"r+")
                        if data_end is None:
                            dfh.seek(0, os.SEEK_END)
                        else:
                            dfh.seek(data_end, os.SEEK_SET)
                    except FileNotFoundError:
                        dfh = self.opener(self.data_file, mode=b"w+")
                        transaction.add(self.data_file, dsize)
                if self.sidedata_file is not None:
                    assert sidedata_end is not None
                    # revlog-v2 does not inline, help Pytype
                    assert dfh is not None
                    try:
                        sdfh = self.opener(self.sidedata_file, mode=b"r+")
                        dfh.seek(sidedata_end, os.SEEK_SET)
                    except FileNotFoundError:
                        sdfh = self.opener(self.sidedata_file, mode=b"w+")
                        transaction.add(self.sidedata_file, sidedata_end)

                # opening the index file.
                isize = r * self.index.entry_size
                ifh = self.__index_write_fp()
                if self.inline:
                    transaction.add(self.index_file, dsize + isize)
                else:
                    transaction.add(self.index_file, isize)
                # exposing all file handles for writing.
                self._writinghandles = (ifh, dfh, sdfh)
                self._segmentfile.writing_handle = ifh if self.inline else dfh
                self._segmentfile_sidedata.writing_handle = sdfh
                yield
            finally:
                self._writinghandles = None
                self._segmentfile.writing_handle = None
                self._segmentfile_sidedata.writing_handle = None
                if dfh is not None:
                    dfh.close()
                if sdfh is not None:
                    sdfh.close()
                # closing the index file last to avoid exposing referent to
                # potential unflushed data content.
                if ifh is not None:
                    ifh.close()

    def __index_write_fp(self, index_end=None):
        """internal method to open the index file for writing

        You should not use this directly and use `_writing` instead
        """
        try:
            f = self.opener(
                self.index_file,
                mode=b"r+",
                checkambig=self.data_config.check_ambig,
            )
            if index_end is None:
                f.seek(0, os.SEEK_END)
            else:
                f.seek(index_end, os.SEEK_SET)
            return f
        except FileNotFoundError:
            return self.opener(
                self.index_file,
                mode=b"w+",
                checkambig=self.data_config.check_ambig,
            )

    def __index_new_fp(self):
        """internal method to create a new index file for writing

        You should not use this unless you are upgrading from inline revlog
        """
        return self.opener(
            self.index_file,
            mode=b"w",
            checkambig=self.data_config.check_ambig,
            atomictemp=True,
        )

    def split_inline(self, tr, header, new_index_file_path=None):
        """split the data of an inline revlog into an index and a data file"""
        existing_handles = False
        if self._writinghandles is not None:
            existing_handles = True
            fp = self._writinghandles[0]
            fp.flush()
            fp.close()
            # We can't use the cached file handle after close(). So prevent
            # its usage.
            self._writinghandles = None
            self._segmentfile.writing_handle = None
            # No need to deal with sidedata writing handle as it is only
            # relevant with revlog-v2 which is never inline, not reaching
            # this code

        new_dfh = self.opener(self.data_file, mode=b"w+")
        new_dfh.truncate(0)  # drop any potentially existing data
        try:
            with self.reading():
                for r in range(len(self.index)):
                    new_dfh.write(self.get_segment_for_revs(r, r)[1])
                new_dfh.flush()

            if new_index_file_path is not None:
                self.index_file = new_index_file_path
            with self.__index_new_fp() as fp:
                self.inline = False
                for i in range(len(self.index)):
                    e = self.index.entry_binary(i)
                    if i == 0:
                        packed_header = self.index.pack_header(header)
                        e = packed_header + e
                    fp.write(e)

                # If we don't use side-write, the temp file replaces the real
                # index when we exit the context manager

            self._segmentfile = randomaccessfile.randomaccessfile(
                self.opener,
                self.data_file,
                self.data_config.chunk_cache_size,
            )

            if existing_handles:
                # switched from inline to conventional; reopen the index
                ifh = self.__index_write_fp()
                self._writinghandles = (ifh, new_dfh, None)
                self._segmentfile.writing_handle = new_dfh
                new_dfh = None
                # No need to deal with sidedata writing handle as it is only
                # relevant with revlog-v2 which is never inline, not reaching
                # this code
        finally:
            if new_dfh is not None:
                new_dfh.close()
        return self.index_file

    def get_segment_for_revs(self, startrev, endrev):
        """Obtain a segment of raw data corresponding to a range of revisions.

        Accepts the start and end revisions and an optional already-open
        file handle to be used for reading. If the file handle is read, its
        seek position will not be preserved.

        Requests for data may be satisfied by a cache.

        Returns a 2-tuple of (offset, data) for the requested range of
        revisions. Offset is the integer offset from the beginning of the
        revlog and data is a str or buffer of the raw byte data.

        Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
        to determine where each revision's data begins and ends.

        API: we should consider making this a private part of the InnerRevlog
        at some point.
        """
        # Inlined self.start(startrev) & self.end(endrev) for perf reasons
        # (functions are expensive).
        index = self.index
        istart = index[startrev]
        start = int(istart[0] >> 16)
        if startrev == endrev:
            end = start + istart[1]
        else:
            iend = index[endrev]
            end = int(iend[0] >> 16) + iend[1]

        if self.inline:
            start += (startrev + 1) * self.index.entry_size
            end += (endrev + 1) * self.index.entry_size
        length = end - start

        return start, self._segmentfile.read_chunk(start, length)
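    # For inline revlogs, index entries and data chunks are interleaved in a
    # single file, so the data of rev N starts after N + 1 index entries;
    # the `(rev + 1) * entry_size` adjustments above account for that layout.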

    def _chunk(self, rev):
        """Obtain a single decompressed chunk for a revision.

        Accepts an integer revision and an optional already-open file handle
        to be used for reading. If used, the seek position of the file will not
        be preserved.

        Returns a str holding uncompressed data for the requested revision.
        """
        compression_mode = self.index[rev][10]
        data = self.get_segment_for_revs(rev, rev)[1]
        if compression_mode == COMP_MODE_PLAIN:
            return data
        elif compression_mode == COMP_MODE_DEFAULT:
            return self._decompressor(data)
        elif compression_mode == COMP_MODE_INLINE:
            return self.decompress(data)
        else:
            msg = b'unknown compression mode %d'
            msg %= compression_mode
            raise error.RevlogError(msg)

    def _chunks(self, revs, targetsize=None):
        """Obtain decompressed chunks for the specified revisions.

        Accepts an iterable of numeric revisions that are assumed to be in
        ascending order. Also accepts an optional already-open file handle
        to be used for reading. If used, the seek position of the file will
        not be preserved.

        This function is similar to calling ``self._chunk()`` multiple times,
        but is faster.

        Returns a list with decompressed data for each requested revision.
        """
        if not revs:
            return []
        start = self.start
        length = self.length
        inline = self.inline
        iosize = self.index.entry_size
        buffer = util.buffer

        l = []
        ladd = l.append

        if not self.data_config.with_sparse_read:
            slicedchunks = (revs,)
        else:
            slicedchunks = deltautil.slicechunk(
                self,
                revs,
                targetsize=targetsize,
            )
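        # slicechunk regroups `revs` into slices that are dense enough to be
        # fetched in one read, based on the sr_density_threshold and
        # sr_min_gap_size settings of the data config (and `targetsize`
        # when provided).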

        for revschunk in slicedchunks:
            firstrev = revschunk[0]
            # Skip trailing revisions with empty diff
            for lastrev in revschunk[::-1]:
                if length(lastrev) != 0:
                    break

            try:
                offset, data = self.get_segment_for_revs(firstrev, lastrev)
            except OverflowError:
                # issue4215 - we can't cache a run of chunks greater than
                # 2G on Windows
                return [self._chunk(rev) for rev in revschunk]

            decomp = self.decompress
            # self._decompressor might be None, but will not be used in that case
            def_decomp = self._decompressor
            for rev in revschunk:
                chunkstart = start(rev)
                if inline:
                    chunkstart += (rev + 1) * iosize
                chunklength = length(rev)
                comp_mode = self.index[rev][10]
                c = buffer(data, chunkstart - offset, chunklength)
                if comp_mode == COMP_MODE_PLAIN:
                    ladd(c)
                elif comp_mode == COMP_MODE_INLINE:
                    ladd(decomp(c))
                elif comp_mode == COMP_MODE_DEFAULT:
                    ladd(def_decomp(c))
                else:
                    msg = b'unknown compression mode %d'
                    msg %= comp_mode
                    raise error.RevlogError(msg)

        return l

    def raw_text(self, node, rev):
        """return the possibly unvalidated rawtext for a revision

        returns (rev, rawtext, validated)
        """

        # revision in the cache (could be useful to apply delta)
        cachedrev = None
        # An intermediate text to apply deltas to
        basetext = None

        # Check if we have the entry in cache
        # The cache entry looks like (node, rev, rawtext)
        if self._revisioncache:
            cachedrev = self._revisioncache[1]

        chain, stopped = self._deltachain(rev, stoprev=cachedrev)
        if stopped:
            basetext = self._revisioncache[2]

        # drop cache to save memory, the caller is expected to
        # update self._inner._revisioncache after validating the text
        self._revisioncache = None

        targetsize = None
        rawsize = self.index[rev][2]
        if 0 <= rawsize:
            targetsize = 4 * rawsize

        bins = self._chunks(chain, targetsize=targetsize)
        if basetext is None:
            basetext = bytes(bins[0])
            bins = bins[1:]

        rawtext = mdiff.patches(basetext, bins)
        del basetext  # let us have a chance to free memory early
        return (rev, rawtext, False)
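    # raw_text rebuilds a revision by reading the whole delta chain in one
    # batched pass (_chunks) and applying each delta to the base text with
    # mdiff.patches; hash validation is left to the caller, hence the
    # `False` ("not validated") in the returned tuple.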
952
956
953 def sidedata(self, rev, sidedata_end):
957 def sidedata(self, rev, sidedata_end):
954 """Return the sidedata for a given revision number."""
958 """Return the sidedata for a given revision number."""
955 index_entry = self.index[rev]
959 index_entry = self.index[rev]
956 sidedata_offset = index_entry[8]
960 sidedata_offset = index_entry[8]
957 sidedata_size = index_entry[9]
961 sidedata_size = index_entry[9]
958
962
959 if self.inline:
963 if self.inline:
960 sidedata_offset += self.index.entry_size * (1 + rev)
964 sidedata_offset += self.index.entry_size * (1 + rev)
961 if sidedata_size == 0:
965 if sidedata_size == 0:
962 return {}
966 return {}
963
967
964 if sidedata_end < sidedata_offset + sidedata_size:
968 if sidedata_end < sidedata_offset + sidedata_size:
965 filename = self.sidedata_file
969 filename = self.sidedata_file
966 end = sidedata_end
970 end = sidedata_end
967 offset = sidedata_offset
971 offset = sidedata_offset
968 length = sidedata_size
972 length = sidedata_size
969 m = FILE_TOO_SHORT_MSG % (filename, length, offset, end)
973 m = FILE_TOO_SHORT_MSG % (filename, length, offset, end)
970 raise error.RevlogError(m)
974 raise error.RevlogError(m)
971
975
972 comp_segment = self._segmentfile_sidedata.read_chunk(
976 comp_segment = self._segmentfile_sidedata.read_chunk(
973 sidedata_offset, sidedata_size
977 sidedata_offset, sidedata_size
974 )
978 )
975
979
976 comp = self.index[rev][11]
980 comp = self.index[rev][11]
977 if comp == COMP_MODE_PLAIN:
981 if comp == COMP_MODE_PLAIN:
978 segment = comp_segment
982 segment = comp_segment
979 elif comp == COMP_MODE_DEFAULT:
983 elif comp == COMP_MODE_DEFAULT:
980 segment = self._decompressor(comp_segment)
984 segment = self._decompressor(comp_segment)
981 elif comp == COMP_MODE_INLINE:
985 elif comp == COMP_MODE_INLINE:
982 segment = self.decompress(comp_segment)
986 segment = self.decompress(comp_segment)
983 else:
987 else:
984 msg = b'unknown compression mode %d'
988 msg = b'unknown compression mode %d'
985 msg %= comp
989 msg %= comp
986 raise error.RevlogError(msg)
990 raise error.RevlogError(msg)
987
991
988 sidedata = sidedatautil.deserialize_sidedata(segment)
992 sidedata = sidedatautil.deserialize_sidedata(segment)
989 return sidedata
993 return sidedata
990
994
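The per-entry compression dispatch above (plain / default / inline) can be summarized with a small sketch. The constants and the zlib fallback below are stand-ins chosen so the example runs on its own; they are not the real compression-engine plumbing.

import zlib

# Toy stand-ins for the COMP_MODE_* constants carried by the index entry.
COMP_MODE_PLAIN, COMP_MODE_DEFAULT, COMP_MODE_INLINE = 0, 1, 2

def decode_segment(comp_mode, segment, default_decompress=zlib.decompress):
    """Dispatch on the per-entry compression mode, as sidedata() does."""
    if comp_mode == COMP_MODE_PLAIN:
        return segment                      # stored verbatim
    elif comp_mode == COMP_MODE_DEFAULT:
        return default_decompress(segment)  # revlog-wide default engine
    elif comp_mode == COMP_MODE_INLINE:
        # real revlogs sniff a per-chunk engine marker here; this sketch
        # simply assumes zlib for the sake of a runnable example
        return zlib.decompress(segment)
    raise ValueError('unknown compression mode %d' % comp_mode)

assert decode_segment(COMP_MODE_PLAIN, b'raw') == b'raw'
assert decode_segment(COMP_MODE_DEFAULT, zlib.compress(b'data')) == b'data'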
991 def write_entry(
995 def write_entry(
992 self,
996 self,
993 transaction,
997 transaction,
994 entry,
998 entry,
995 data,
999 data,
996 link,
1000 link,
997 offset,
1001 offset,
998 sidedata,
1002 sidedata,
999 sidedata_offset,
1003 sidedata_offset,
1000 index_end,
1004 index_end,
1001 data_end,
1005 data_end,
1002 sidedata_end,
1006 sidedata_end,
1003 ):
1007 ):
1004 # Files opened in a+ mode have inconsistent behavior on various
1008 # Files opened in a+ mode have inconsistent behavior on various
1005 # platforms. Windows requires that a file positioning call be made
1009 # platforms. Windows requires that a file positioning call be made
1006 # when the file handle transitions between reads and writes. See
1010 # when the file handle transitions between reads and writes. See
1007 # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
1011 # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
1008 # platforms, Python or the platform itself can be buggy. Some versions
1012 # platforms, Python or the platform itself can be buggy. Some versions
1009 # of Solaris have been observed to not append at the end of the file
1013 # of Solaris have been observed to not append at the end of the file
1010 # if the file was seeked to before the end. See issue4943 for more.
1014 # if the file was seeked to before the end. See issue4943 for more.
1011 #
1015 #
1012 # We work around this issue by inserting a seek() before writing.
1016 # We work around this issue by inserting a seek() before writing.
1013 # Note: This is likely not necessary on Python 3. However, because
1017 # Note: This is likely not necessary on Python 3. However, because
1014 # the file handle is reused for reads and may be seeked there, we need
1018 # the file handle is reused for reads and may be seeked there, we need
1015 # to be careful before changing this.
1019 # to be careful before changing this.
1016 if self._writinghandles is None:
1020 if self._writinghandles is None:
1017 msg = b'adding revision outside `revlog._writing` context'
1021 msg = b'adding revision outside `revlog._writing` context'
1018 raise error.ProgrammingError(msg)
1022 raise error.ProgrammingError(msg)
1019 ifh, dfh, sdfh = self._writinghandles
1023 ifh, dfh, sdfh = self._writinghandles
1020 if index_end is None:
1024 if index_end is None:
1021 ifh.seek(0, os.SEEK_END)
1025 ifh.seek(0, os.SEEK_END)
1022 else:
1026 else:
1023 ifh.seek(index_end, os.SEEK_SET)
1027 ifh.seek(index_end, os.SEEK_SET)
1024 if dfh:
1028 if dfh:
1025 if data_end is None:
1029 if data_end is None:
1026 dfh.seek(0, os.SEEK_END)
1030 dfh.seek(0, os.SEEK_END)
1027 else:
1031 else:
1028 dfh.seek(data_end, os.SEEK_SET)
1032 dfh.seek(data_end, os.SEEK_SET)
1029 if sdfh:
1033 if sdfh:
1030 sdfh.seek(sidedata_end, os.SEEK_SET)
1034 sdfh.seek(sidedata_end, os.SEEK_SET)
1031
1035
1032 curr = len(self.index) - 1
1036 curr = len(self.index) - 1
1033 if not self.inline:
1037 if not self.inline:
1034 transaction.add(self.data_file, offset)
1038 transaction.add(self.data_file, offset)
1035 if self.sidedata_file:
1039 if self.sidedata_file:
1036 transaction.add(self.sidedata_file, sidedata_offset)
1040 transaction.add(self.sidedata_file, sidedata_offset)
1037 transaction.add(self.index_file, curr * len(entry))
1041 transaction.add(self.canonical_index_file, curr * len(entry))
1038 if data[0]:
1042 if data[0]:
1039 dfh.write(data[0])
1043 dfh.write(data[0])
1040 dfh.write(data[1])
1044 dfh.write(data[1])
1041 if sidedata:
1045 if sidedata:
1042 sdfh.write(sidedata)
1046 sdfh.write(sidedata)
1043 ifh.write(entry)
1047 ifh.write(entry)
1044 else:
1048 else:
1045 offset += curr * self.index.entry_size
1049 offset += curr * self.index.entry_size
1046 transaction.add(self.index_file, offset)
1050 transaction.add(self.canonical_index_file, offset)
1047 ifh.write(entry)
1051 ifh.write(entry)
1048 ifh.write(data[0])
1052 ifh.write(data[0])
1049 ifh.write(data[1])
1053 ifh.write(data[1])
1050 assert not sidedata
1054 assert not sidedata
1051 return (
1055 return (
1052 ifh.tell(),
1056 ifh.tell(),
1053 dfh.tell() if dfh else None,
1057 dfh.tell() if dfh else None,
1054 sdfh.tell() if sdfh else None,
1058 sdfh.tell() if sdfh else None,
1055 )
1059 )
1056
1060
1057
1061
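The platform notes in `write_entry` boil down to one defensive rule: never trust the implicit position of an append-mode handle; always seek first. A minimal sketch of that pattern follows; the names are hypothetical.

import os

def append_record(fh, payload, known_end=None):
    """Seek explicitly before writing, as write_entry() does.

    `known_end` is the expected end offset recorded elsewhere (e.g. in a
    docket); when unknown, fall back to seeking to the real end of file.
    """
    if known_end is None:
        fh.seek(0, os.SEEK_END)          # append at whatever the end is
    else:
        fh.seek(known_end, os.SEEK_SET)  # append at the recorded end
    fh.write(payload)
    return fh.tell()                     # new end offset for the caller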
1058 class revlog:
1062 class revlog:
1059 """
1063 """
1060 the underlying revision storage object
1064 the underlying revision storage object
1061
1065
1062 A revlog consists of two parts, an index and the revision data.
1066 A revlog consists of two parts, an index and the revision data.
1063
1067
1064 The index is a file with a fixed record size containing
1068 The index is a file with a fixed record size containing
1065 information on each revision, including its nodeid (hash), the
1069 information on each revision, including its nodeid (hash), the
1066 nodeids of its parents, the position and offset of its data within
1070 nodeids of its parents, the position and offset of its data within
1067 the data file, and the revision it's based on. Finally, each entry
1071 the data file, and the revision it's based on. Finally, each entry
1068 contains a linkrev entry that can serve as a pointer to external
1072 contains a linkrev entry that can serve as a pointer to external
1069 data.
1073 data.
1070
1074
1071 The revision data itself is a linear collection of data chunks.
1075 The revision data itself is a linear collection of data chunks.
1072 Each chunk represents a revision and is usually represented as a
1076 Each chunk represents a revision and is usually represented as a
1073 delta against the previous chunk. To bound lookup time, runs of
1077 delta against the previous chunk. To bound lookup time, runs of
1074 deltas are limited to about 2 times the length of the original
1078 deltas are limited to about 2 times the length of the original
1075 version data. This makes retrieval of a version proportional to
1079 version data. This makes retrieval of a version proportional to
1076 its size, or O(1) relative to the number of revisions.
1080 its size, or O(1) relative to the number of revisions.
1077
1081
1078 Both pieces of the revlog are written to in an append-only
1082 Both pieces of the revlog are written to in an append-only
1079 fashion, which means we never need to rewrite a file to insert or
1083 fashion, which means we never need to rewrite a file to insert or
1080 remove data, and can use some simple techniques to avoid the need
1084 remove data, and can use some simple techniques to avoid the need
1081 for locking while reading.
1085 for locking while reading.
1082
1086
1083 If checkambig, indexfile is opened with checkambig=True at
1087 If checkambig, indexfile is opened with checkambig=True at
1084 writing, to avoid file stat ambiguity.
1088 writing, to avoid file stat ambiguity.
1085
1089
1086 If mmaplargeindex is True, and an mmapindexthreshold is set, the
1090 If mmaplargeindex is True, and an mmapindexthreshold is set, the
1087 index will be mmapped rather than read if it is larger than the
1091 index will be mmapped rather than read if it is larger than the
1088 configured threshold.
1092 configured threshold.
1089
1093
1090 If censorable is True, the revlog can have censored revisions.
1094 If censorable is True, the revlog can have censored revisions.
1091
1095
1092 If `upperboundcomp` is not None, this is the expected maximal gain from
1096 If `upperboundcomp` is not None, this is the expected maximal gain from
1093 compression for the data content.
1097 compression for the data content.
1094
1098
1095 `concurrencychecker` is an optional function that receives 3 arguments: a
1099 `concurrencychecker` is an optional function that receives 3 arguments: a
1096 file handle, a filename, and an expected position. It should check whether
1100 file handle, a filename, and an expected position. It should check whether
1097 the current position in the file handle is valid, and log/warn/fail (by
1101 the current position in the file handle is valid, and log/warn/fail (by
1098 raising).
1102 raising).
1099
1103
1100 See mercurial/revlogutils/constants.py for details about the content of an
1104 See mercurial/revlogutils/constants.py for details about the content of an
1101 index entry.
1105 index entry.
1102 """
1106 """
1103
1107
1104 _flagserrorclass = error.RevlogError
1108 _flagserrorclass = error.RevlogError
1105
1109
1106 @staticmethod
1110 @staticmethod
1107 def is_inline_index(header_bytes):
1111 def is_inline_index(header_bytes):
1108 """Determine if a revlog is inline from the initial bytes of the index"""
1112 """Determine if a revlog is inline from the initial bytes of the index"""
1109 header = INDEX_HEADER.unpack(header_bytes)[0]
1113 header = INDEX_HEADER.unpack(header_bytes)[0]
1110
1114
1111 _format_flags = header & ~0xFFFF
1115 _format_flags = header & ~0xFFFF
1112 _format_version = header & 0xFFFF
1116 _format_version = header & 0xFFFF
1113
1117
1114 features = FEATURES_BY_VERSION[_format_version]
1118 features = FEATURES_BY_VERSION[_format_version]
1115 return features[b'inline'](_format_flags)
1119 return features[b'inline'](_format_flags)
1116
1120
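A small sketch of the header split performed by `is_inline_index`: the first four index bytes hold a big-endian word whose low 16 bits are the format version and whose high bits are feature flags (inline data among them for v1). The constants below mirror the imported ones but are redefined here so the example stands alone.

import struct

INDEX_HEADER = struct.Struct(b'>I')  # same shape as the imported constant
FLAG_INLINE_DATA = 1 << 16           # assumed v1 inline-flag position

def split_header(header_bytes):
    header = INDEX_HEADER.unpack(header_bytes[:4])[0]
    version = header & 0xFFFF
    flags = header & ~0xFFFF
    return version, flags

version, flags = split_header(struct.pack(b'>I', (1 << 16) | 1))
assert version == 1 and flags & FLAG_INLINE_DATA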
1117 def __init__(
1121 def __init__(
1118 self,
1122 self,
1119 opener,
1123 opener,
1120 target,
1124 target,
1121 radix,
1125 radix,
1122 postfix=None, # only exist for `tmpcensored` now
1126 postfix=None, # only exist for `tmpcensored` now
1123 checkambig=False,
1127 checkambig=False,
1124 mmaplargeindex=False,
1128 mmaplargeindex=False,
1125 censorable=False,
1129 censorable=False,
1126 upperboundcomp=None,
1130 upperboundcomp=None,
1127 persistentnodemap=False,
1131 persistentnodemap=False,
1128 concurrencychecker=None,
1132 concurrencychecker=None,
1129 trypending=False,
1133 trypending=False,
1130 try_split=False,
1134 try_split=False,
1131 canonical_parent_order=True,
1135 canonical_parent_order=True,
1132 ):
1136 ):
1133 """
1137 """
1134 create a revlog object
1138 create a revlog object
1135
1139
1136 opener is a function that abstracts the file opening operation
1140 opener is a function that abstracts the file opening operation
1137 and can be used to implement COW semantics or the like.
1141 and can be used to implement COW semantics or the like.
1138
1142
1139 `target`: a (KIND, ID) tuple that identifies the content stored in
1143 `target`: a (KIND, ID) tuple that identifies the content stored in
1140 this revlog. It helps the rest of the code to understand what the revlog
1144 this revlog. It helps the rest of the code to understand what the revlog
1141 is about without having to resort to heuristics and index filename
1145 is about without having to resort to heuristics and index filename
1142 analysis. Note that this must reliably be set by normal code, but
1146 analysis. Note that this must reliably be set by normal code, but
1143 that test, debug, or performance measurement code might not set this to an
1147 that test, debug, or performance measurement code might not set this to an
1144 accurate value.
1148 accurate value.
1145 """
1149 """
1146
1150
1147 self.radix = radix
1151 self.radix = radix
1148
1152
1149 self._docket_file = None
1153 self._docket_file = None
1150 self._indexfile = None
1154 self._indexfile = None
1151 self._datafile = None
1155 self._datafile = None
1152 self._sidedatafile = None
1156 self._sidedatafile = None
1153 self._nodemap_file = None
1157 self._nodemap_file = None
1154 self.postfix = postfix
1158 self.postfix = postfix
1155 self._trypending = trypending
1159 self._trypending = trypending
1156 self._try_split = try_split
1160 self._try_split = try_split
1157 self.opener = opener
1161 self.opener = opener
1158 if persistentnodemap:
1162 if persistentnodemap:
1159 self._nodemap_file = nodemaputil.get_nodemap_file(self)
1163 self._nodemap_file = nodemaputil.get_nodemap_file(self)
1160
1164
1161 assert target[0] in ALL_KINDS
1165 assert target[0] in ALL_KINDS
1162 assert len(target) == 2
1166 assert len(target) == 2
1163 self.target = target
1167 self.target = target
1164 if b'feature-config' in self.opener.options:
1168 if b'feature-config' in self.opener.options:
1165 self.feature_config = self.opener.options[b'feature-config'].copy()
1169 self.feature_config = self.opener.options[b'feature-config'].copy()
1166 else:
1170 else:
1167 self.feature_config = FeatureConfig()
1171 self.feature_config = FeatureConfig()
1168 self.feature_config.censorable = censorable
1172 self.feature_config.censorable = censorable
1169 self.feature_config.canonical_parent_order = canonical_parent_order
1173 self.feature_config.canonical_parent_order = canonical_parent_order
1170 if b'data-config' in self.opener.options:
1174 if b'data-config' in self.opener.options:
1171 self.data_config = self.opener.options[b'data-config'].copy()
1175 self.data_config = self.opener.options[b'data-config'].copy()
1172 else:
1176 else:
1173 self.data_config = DataConfig()
1177 self.data_config = DataConfig()
1174 self.data_config.check_ambig = checkambig
1178 self.data_config.check_ambig = checkambig
1175 self.data_config.mmap_large_index = mmaplargeindex
1179 self.data_config.mmap_large_index = mmaplargeindex
1176 if b'delta-config' in self.opener.options:
1180 if b'delta-config' in self.opener.options:
1177 self.delta_config = self.opener.options[b'delta-config'].copy()
1181 self.delta_config = self.opener.options[b'delta-config'].copy()
1178 else:
1182 else:
1179 self.delta_config = DeltaConfig()
1183 self.delta_config = DeltaConfig()
1180 self.delta_config.upper_bound_comp = upperboundcomp
1184 self.delta_config.upper_bound_comp = upperboundcomp
1181
1185
1182 # Maps rev to chain base rev.
1186 # Maps rev to chain base rev.
1183 self._chainbasecache = util.lrucachedict(100)
1187 self._chainbasecache = util.lrucachedict(100)
1184
1188
1185 self.index = None
1189 self.index = None
1186 self._docket = None
1190 self._docket = None
1187 self._nodemap_docket = None
1191 self._nodemap_docket = None
1188 # Mapping of partial identifiers to full nodes.
1192 # Mapping of partial identifiers to full nodes.
1189 self._pcache = {}
1193 self._pcache = {}
1190
1194
1191 # other optional features
1195 # other optional features
1192
1196
1193 # Make copy of flag processors so each revlog instance can support
1197 # Make copy of flag processors so each revlog instance can support
1194 # custom flags.
1198 # custom flags.
1195 self._flagprocessors = dict(flagutil.flagprocessors)
1199 self._flagprocessors = dict(flagutil.flagprocessors)
1196 # prevent nesting of addgroup
1200 # prevent nesting of addgroup
1197 self._adding_group = None
1201 self._adding_group = None
1198
1202
1199 chunk_cache = self._loadindex()
1203 chunk_cache = self._loadindex()
1200 self._load_inner(chunk_cache)
1204 self._load_inner(chunk_cache)
1201 self._concurrencychecker = concurrencychecker
1205 self._concurrencychecker = concurrencychecker
1202
1206
1203 @property
1207 @property
1204 def _generaldelta(self):
1208 def _generaldelta(self):
1205 """temporary compatibility proxy"""
1209 """temporary compatibility proxy"""
1206 util.nouideprecwarn(
1210 util.nouideprecwarn(
1207 b"use revlog.delta_config.general_delta", b"6.6", stacklevel=2
1211 b"use revlog.delta_config.general_delta", b"6.6", stacklevel=2
1208 )
1212 )
1209 return self.delta_config.general_delta
1213 return self.delta_config.general_delta
1210
1214
1211 @property
1215 @property
1212 def _checkambig(self):
1216 def _checkambig(self):
1213 """temporary compatibility proxy"""
1217 """temporary compatibility proxy"""
1214 util.nouideprecwarn(
1218 util.nouideprecwarn(
1215 b"use revlog.data_config.checkambig", b"6.6", stacklevel=2
1219 b"use revlog.data_config.checkambig", b"6.6", stacklevel=2
1216 )
1220 )
1217 return self.data_config.check_ambig
1221 return self.data_config.check_ambig
1218
1222
1219 @property
1223 @property
1220 def _mmaplargeindex(self):
1224 def _mmaplargeindex(self):
1221 """temporary compatibility proxy"""
1225 """temporary compatibility proxy"""
1222 util.nouideprecwarn(
1226 util.nouideprecwarn(
1223 b"use revlog.data_config.mmap_large_index", b"6.6", stacklevel=2
1227 b"use revlog.data_config.mmap_large_index", b"6.6", stacklevel=2
1224 )
1228 )
1225 return self.data_config.mmap_large_index
1229 return self.data_config.mmap_large_index
1226
1230
1227 @property
1231 @property
1228 def _censorable(self):
1232 def _censorable(self):
1229 """temporary compatibility proxy"""
1233 """temporary compatibility proxy"""
1230 util.nouideprecwarn(
1234 util.nouideprecwarn(
1231 b"use revlog.feature_config.censorable", b"6.6", stacklevel=2
1235 b"use revlog.feature_config.censorable", b"6.6", stacklevel=2
1232 )
1236 )
1233 return self.feature_config.censorable
1237 return self.feature_config.censorable
1234
1238
1235 @property
1239 @property
1236 def _chunkcachesize(self):
1240 def _chunkcachesize(self):
1237 """temporary compatibility proxy"""
1241 """temporary compatibility proxy"""
1238 util.nouideprecwarn(
1242 util.nouideprecwarn(
1239 b"use revlog.data_config.chunk_cache_size", b"6.6", stacklevel=2
1243 b"use revlog.data_config.chunk_cache_size", b"6.6", stacklevel=2
1240 )
1244 )
1241 return self.data_config.chunk_cache_size
1245 return self.data_config.chunk_cache_size
1242
1246
1243 @property
1247 @property
1244 def _maxchainlen(self):
1248 def _maxchainlen(self):
1245 """temporary compatibility proxy"""
1249 """temporary compatibility proxy"""
1246 util.nouideprecwarn(
1250 util.nouideprecwarn(
1247 b"use revlog.delta_config.max_chain_len", b"6.6", stacklevel=2
1251 b"use revlog.delta_config.max_chain_len", b"6.6", stacklevel=2
1248 )
1252 )
1249 return self.delta_config.max_chain_len
1253 return self.delta_config.max_chain_len
1250
1254
1251 @property
1255 @property
1252 def _deltabothparents(self):
1256 def _deltabothparents(self):
1253 """temporary compatibility proxy"""
1257 """temporary compatibility proxy"""
1254 util.nouideprecwarn(
1258 util.nouideprecwarn(
1255 b"use revlog.delta_config.delta_both_parents", b"6.6", stacklevel=2
1259 b"use revlog.delta_config.delta_both_parents", b"6.6", stacklevel=2
1256 )
1260 )
1257 return self.delta_config.delta_both_parents
1261 return self.delta_config.delta_both_parents
1258
1262
1259 @property
1263 @property
1260 def _candidate_group_chunk_size(self):
1264 def _candidate_group_chunk_size(self):
1261 """temporary compatibility proxy"""
1265 """temporary compatibility proxy"""
1262 util.nouideprecwarn(
1266 util.nouideprecwarn(
1263 b"use revlog.delta_config.candidate_group_chunk_size",
1267 b"use revlog.delta_config.candidate_group_chunk_size",
1264 b"6.6",
1268 b"6.6",
1265 stacklevel=2,
1269 stacklevel=2,
1266 )
1270 )
1267 return self.delta_config.candidate_group_chunk_size
1271 return self.delta_config.candidate_group_chunk_size
1268
1272
1269 @property
1273 @property
1270 def _debug_delta(self):
1274 def _debug_delta(self):
1271 """temporary compatibility proxy"""
1275 """temporary compatibility proxy"""
1272 util.nouideprecwarn(
1276 util.nouideprecwarn(
1273 b"use revlog.delta_config.debug_delta", b"6.6", stacklevel=2
1277 b"use revlog.delta_config.debug_delta", b"6.6", stacklevel=2
1274 )
1278 )
1275 return self.delta_config.debug_delta
1279 return self.delta_config.debug_delta
1276
1280
1277 @property
1281 @property
1278 def _compengine(self):
1282 def _compengine(self):
1279 """temporary compatibility proxy"""
1283 """temporary compatibility proxy"""
1280 util.nouideprecwarn(
1284 util.nouideprecwarn(
1281 b"use revlog.feature_config.compression_engine",
1285 b"use revlog.feature_config.compression_engine",
1282 b"6.6",
1286 b"6.6",
1283 stacklevel=2,
1287 stacklevel=2,
1284 )
1288 )
1285 return self.feature_config.compression_engine
1289 return self.feature_config.compression_engine
1286
1290
1287 @property
1291 @property
1288 def upperboundcomp(self):
1292 def upperboundcomp(self):
1289 """temporary compatibility proxy"""
1293 """temporary compatibility proxy"""
1290 util.nouideprecwarn(
1294 util.nouideprecwarn(
1291 b"use revlog.delta_config.upper_bound_comp",
1295 b"use revlog.delta_config.upper_bound_comp",
1292 b"6.6",
1296 b"6.6",
1293 stacklevel=2,
1297 stacklevel=2,
1294 )
1298 )
1295 return self.delta_config.upper_bound_comp
1299 return self.delta_config.upper_bound_comp
1296
1300
1297 @property
1301 @property
1298 def _compengineopts(self):
1302 def _compengineopts(self):
1299 """temporary compatibility proxy"""
1303 """temporary compatibility proxy"""
1300 util.nouideprecwarn(
1304 util.nouideprecwarn(
1301 b"use revlog.feature_config.compression_engine_options",
1305 b"use revlog.feature_config.compression_engine_options",
1302 b"6.6",
1306 b"6.6",
1303 stacklevel=2,
1307 stacklevel=2,
1304 )
1308 )
1305 return self.feature_config.compression_engine_options
1309 return self.feature_config.compression_engine_options
1306
1310
1307 @property
1311 @property
1308 def _maxdeltachainspan(self):
1312 def _maxdeltachainspan(self):
1309 """temporary compatibility proxy"""
1313 """temporary compatibility proxy"""
1310 util.nouideprecwarn(
1314 util.nouideprecwarn(
1311 b"use revlog.delta_config.max_deltachain_span", b"6.6", stacklevel=2
1315 b"use revlog.delta_config.max_deltachain_span", b"6.6", stacklevel=2
1312 )
1316 )
1313 return self.delta_config.max_deltachain_span
1317 return self.delta_config.max_deltachain_span
1314
1318
1315 @property
1319 @property
1316 def _withsparseread(self):
1320 def _withsparseread(self):
1317 """temporary compatibility proxy"""
1321 """temporary compatibility proxy"""
1318 util.nouideprecwarn(
1322 util.nouideprecwarn(
1319 b"use revlog.data_config.with_sparse_read", b"6.6", stacklevel=2
1323 b"use revlog.data_config.with_sparse_read", b"6.6", stacklevel=2
1320 )
1324 )
1321 return self.data_config.with_sparse_read
1325 return self.data_config.with_sparse_read
1322
1326
1323 @property
1327 @property
1324 def _sparserevlog(self):
1328 def _sparserevlog(self):
1325 """temporary compatibility proxy"""
1329 """temporary compatibility proxy"""
1326 util.nouideprecwarn(
1330 util.nouideprecwarn(
1327 b"use revlog.delta_config.sparse_revlog", b"6.6", stacklevel=2
1331 b"use revlog.delta_config.sparse_revlog", b"6.6", stacklevel=2
1328 )
1332 )
1329 return self.delta_config.sparse_revlog
1333 return self.delta_config.sparse_revlog
1330
1334
1331 @property
1335 @property
1332 def hassidedata(self):
1336 def hassidedata(self):
1333 """temporary compatibility proxy"""
1337 """temporary compatibility proxy"""
1334 util.nouideprecwarn(
1338 util.nouideprecwarn(
1335 b"use revlog.feature_config.has_side_data", b"6.6", stacklevel=2
1339 b"use revlog.feature_config.has_side_data", b"6.6", stacklevel=2
1336 )
1340 )
1337 return self.feature_config.has_side_data
1341 return self.feature_config.has_side_data
1338
1342
1339 @property
1343 @property
1340 def _srdensitythreshold(self):
1344 def _srdensitythreshold(self):
1341 """temporary compatibility proxy"""
1345 """temporary compatibility proxy"""
1342 util.nouideprecwarn(
1346 util.nouideprecwarn(
1343 b"use revlog.data_config.sr_density_threshold",
1347 b"use revlog.data_config.sr_density_threshold",
1344 b"6.6",
1348 b"6.6",
1345 stacklevel=2,
1349 stacklevel=2,
1346 )
1350 )
1347 return self.data_config.sr_density_threshold
1351 return self.data_config.sr_density_threshold
1348
1352
1349 @property
1353 @property
1350 def _srmingapsize(self):
1354 def _srmingapsize(self):
1351 """temporary compatibility proxy"""
1355 """temporary compatibility proxy"""
1352 util.nouideprecwarn(
1356 util.nouideprecwarn(
1353 b"use revlog.data_config.sr_min_gap_size", b"6.6", stacklevel=2
1357 b"use revlog.data_config.sr_min_gap_size", b"6.6", stacklevel=2
1354 )
1358 )
1355 return self.data_config.sr_min_gap_size
1359 return self.data_config.sr_min_gap_size
1356
1360
1357 @property
1361 @property
1358 def _compute_rank(self):
1362 def _compute_rank(self):
1359 """temporary compatibility proxy"""
1363 """temporary compatibility proxy"""
1360 util.nouideprecwarn(
1364 util.nouideprecwarn(
1361 b"use revlog.feature_config.compute_rank", b"6.6", stacklevel=2
1365 b"use revlog.feature_config.compute_rank", b"6.6", stacklevel=2
1362 )
1366 )
1363 return self.feature_config.compute_rank
1367 return self.feature_config.compute_rank
1364
1368
1365 @property
1369 @property
1366 def canonical_parent_order(self):
1370 def canonical_parent_order(self):
1367 """temporary compatibility proxy"""
1371 """temporary compatibility proxy"""
1368 util.nouideprecwarn(
1372 util.nouideprecwarn(
1369 b"use revlog.feature_config.canonical_parent_order",
1373 b"use revlog.feature_config.canonical_parent_order",
1370 b"6.6",
1374 b"6.6",
1371 stacklevel=2,
1375 stacklevel=2,
1372 )
1376 )
1373 return self.feature_config.canonical_parent_order
1377 return self.feature_config.canonical_parent_order
1374
1378
1375 @property
1379 @property
1376 def _lazydelta(self):
1380 def _lazydelta(self):
1377 """temporary compatibility proxy"""
1381 """temporary compatibility proxy"""
1378 util.nouideprecwarn(
1382 util.nouideprecwarn(
1379 b"use revlog.delta_config.lazy_delta", b"6.6", stacklevel=2
1383 b"use revlog.delta_config.lazy_delta", b"6.6", stacklevel=2
1380 )
1384 )
1381 return self.delta_config.lazy_delta
1385 return self.delta_config.lazy_delta
1382
1386
1383 @property
1387 @property
1384 def _lazydeltabase(self):
1388 def _lazydeltabase(self):
1385 """temporary compatibility proxy"""
1389 """temporary compatibility proxy"""
1386 util.nouideprecwarn(
1390 util.nouideprecwarn(
1387 b"use revlog.delta_config.lazy_delta_base", b"6.6", stacklevel=2
1391 b"use revlog.delta_config.lazy_delta_base", b"6.6", stacklevel=2
1388 )
1392 )
1389 return self.delta_config.lazy_delta_base
1393 return self.delta_config.lazy_delta_base
1390
1394
1391 def _init_opts(self):
1395 def _init_opts(self):
1392 """process options (from above/config) to setup associated default revlog mode
1396 """process options (from above/config) to setup associated default revlog mode
1393
1397
1394 These values might be affected when actually reading on-disk information.
1398 These values might be affected when actually reading on-disk information.
1395
1399
1396 The relevant values are returned for use in _loadindex().
1400 The relevant values are returned for use in _loadindex().
1397
1401
1398 * newversionflags:
1402 * newversionflags:
1399 version header to use if we need to create a new revlog
1403 version header to use if we need to create a new revlog
1400
1404
1401 * mmapindexthreshold:
1405 * mmapindexthreshold:
1402 minimal index size at which to start using mmap
1406 minimal index size at which to start using mmap
1403
1407
1404 * force_nodemap:
1408 * force_nodemap:
1405 force the usage of a "development" version of the nodemap code
1409 force the usage of a "development" version of the nodemap code
1406 """
1410 """
1407 opts = self.opener.options
1411 opts = self.opener.options
1408
1412
1409 if b'changelogv2' in opts and self.revlog_kind == KIND_CHANGELOG:
1413 if b'changelogv2' in opts and self.revlog_kind == KIND_CHANGELOG:
1410 new_header = CHANGELOGV2
1414 new_header = CHANGELOGV2
1411 compute_rank = opts.get(b'changelogv2.compute-rank', True)
1415 compute_rank = opts.get(b'changelogv2.compute-rank', True)
1412 self.feature_config.compute_rank = compute_rank
1416 self.feature_config.compute_rank = compute_rank
1413 elif b'revlogv2' in opts:
1417 elif b'revlogv2' in opts:
1414 new_header = REVLOGV2
1418 new_header = REVLOGV2
1415 elif b'revlogv1' in opts:
1419 elif b'revlogv1' in opts:
1416 new_header = REVLOGV1 | FLAG_INLINE_DATA
1420 new_header = REVLOGV1 | FLAG_INLINE_DATA
1417 if b'generaldelta' in opts:
1421 if b'generaldelta' in opts:
1418 new_header |= FLAG_GENERALDELTA
1422 new_header |= FLAG_GENERALDELTA
1419 elif b'revlogv0' in self.opener.options:
1423 elif b'revlogv0' in self.opener.options:
1420 new_header = REVLOGV0
1424 new_header = REVLOGV0
1421 else:
1425 else:
1422 new_header = REVLOG_DEFAULT_VERSION
1426 new_header = REVLOG_DEFAULT_VERSION
1423
1427
1424 mmapindexthreshold = None
1428 mmapindexthreshold = None
1425 if self.data_config.mmap_large_index:
1429 if self.data_config.mmap_large_index:
1426 mmapindexthreshold = self.data_config.mmap_index_threshold
1430 mmapindexthreshold = self.data_config.mmap_index_threshold
1427 if self.feature_config.enable_ellipsis:
1431 if self.feature_config.enable_ellipsis:
1428 self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor
1432 self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor
1429
1433
1430 # revlog v0 doesn't have flag processors
1434 # revlog v0 doesn't have flag processors
1431 for flag, processor in opts.get(b'flagprocessors', {}).items():
1435 for flag, processor in opts.get(b'flagprocessors', {}).items():
1432 flagutil.insertflagprocessor(flag, processor, self._flagprocessors)
1436 flagutil.insertflagprocessor(flag, processor, self._flagprocessors)
1433
1437
1434 chunk_cache_size = self.data_config.chunk_cache_size
1438 chunk_cache_size = self.data_config.chunk_cache_size
1435 if chunk_cache_size <= 0:
1439 if chunk_cache_size <= 0:
1436 raise error.RevlogError(
1440 raise error.RevlogError(
1437 _(b'revlog chunk cache size %r is not greater than 0')
1441 _(b'revlog chunk cache size %r is not greater than 0')
1438 % chunk_cache_size
1442 % chunk_cache_size
1439 )
1443 )
1440 elif chunk_cache_size & (chunk_cache_size - 1):
1444 elif chunk_cache_size & (chunk_cache_size - 1):
1441 raise error.RevlogError(
1445 raise error.RevlogError(
1442 _(b'revlog chunk cache size %r is not a power of 2')
1446 _(b'revlog chunk cache size %r is not a power of 2')
1443 % chunk_cache_size
1447 % chunk_cache_size
1444 )
1448 )
1445 force_nodemap = opts.get(b'devel-force-nodemap', False)
1449 force_nodemap = opts.get(b'devel-force-nodemap', False)
1446 return new_header, mmapindexthreshold, force_nodemap
1450 return new_header, mmapindexthreshold, force_nodemap
1447
1451
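The `chunk_cache_size & (chunk_cache_size - 1)` test above is the standard bit trick for rejecting sizes that are not powers of two; a tiny demonstration:

def is_power_of_two(n):
    """True for 1, 2, 4, 8, ...; the same test _init_opts applies."""
    return n > 0 and (n & (n - 1)) == 0

assert is_power_of_two(65536)
assert not is_power_of_two(65535)
assert not is_power_of_two(0)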
1448 def _get_data(self, filepath, mmap_threshold, size=None):
1452 def _get_data(self, filepath, mmap_threshold, size=None):
1449 """return a file content with or without mmap
1453 """return a file content with or without mmap
1450
1454
1451 If the file is missing, return the empty string"""
1455 If the file is missing, return the empty string"""
1452 try:
1456 try:
1453 with self.opener(filepath) as fp:
1457 with self.opener(filepath) as fp:
1454 if mmap_threshold is not None:
1458 if mmap_threshold is not None:
1455 file_size = self.opener.fstat(fp).st_size
1459 file_size = self.opener.fstat(fp).st_size
1456 if file_size >= mmap_threshold:
1460 if file_size >= mmap_threshold:
1457 if size is not None:
1461 if size is not None:
1458 # avoid potential mmap crash
1462 # avoid potential mmap crash
1459 size = min(file_size, size)
1463 size = min(file_size, size)
1460 # TODO: should .close() to release resources without
1464 # TODO: should .close() to release resources without
1461 # relying on Python GC
1465 # relying on Python GC
1462 if size is None:
1466 if size is None:
1463 return util.buffer(util.mmapread(fp))
1467 return util.buffer(util.mmapread(fp))
1464 else:
1468 else:
1465 return util.buffer(util.mmapread(fp, size))
1469 return util.buffer(util.mmapread(fp, size))
1466 if size is None:
1470 if size is None:
1467 return fp.read()
1471 return fp.read()
1468 else:
1472 else:
1469 return fp.read(size)
1473 return fp.read(size)
1470 except FileNotFoundError:
1474 except FileNotFoundError:
1471 return b''
1475 return b''
1472
1476
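A hedged sketch of the size-gated mmap read in `_get_data`, using plain `open`/`mmap` in place of the vfs opener; this is a simplified stand-in, not the real implementation.

import mmap
import os

def read_maybe_mmap(path, mmap_threshold=None):
    """Read a whole file, mmapping it once it crosses the threshold."""
    try:
        with open(path, 'rb') as fp:
            if mmap_threshold is not None:
                size = os.fstat(fp.fileno()).st_size
                if size >= mmap_threshold and size > 0:
                    # mmap duplicates the descriptor, so the mapping
                    # stays valid after the `with` block closes `fp`.
                    return mmap.mmap(
                        fp.fileno(), size, access=mmap.ACCESS_READ
                    )
            return fp.read()
    except FileNotFoundError:
        return b''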
1473 def get_streams(self, max_linkrev, force_inline=False):
1477 def get_streams(self, max_linkrev, force_inline=False):
1474 """return a list of streams that represent this revlog
1478 """return a list of streams that represent this revlog
1475
1479
1476 This is used by stream-clone to do byte-for-byte copies of a repository.
1480 This is used by stream-clone to do byte-for-byte copies of a repository.
1477
1481
1478 This streams data for all revisions that refer to a changelog revision up
1482 This streams data for all revisions that refer to a changelog revision up
1479 to `max_linkrev`.
1483 to `max_linkrev`.
1480
1484
1481 If `force_inline` is set, it enforces that the stream will represent an inline revlog.
1485 If `force_inline` is set, it enforces that the stream will represent an inline revlog.
1482
1486
1483 It returns a list of three-tuples:
1487 It returns a list of three-tuples:
1484
1488
1485 [
1489 [
1486 (filename, bytes_stream, stream_size),
1490 (filename, bytes_stream, stream_size),
1487 …
1491 …
1488 ]
1492 ]
1489 """
1493 """
1490 n = len(self)
1494 n = len(self)
1491 index = self.index
1495 index = self.index
1492 while n > 0:
1496 while n > 0:
1493 linkrev = index[n - 1][4]
1497 linkrev = index[n - 1][4]
1494 if linkrev < max_linkrev:
1498 if linkrev < max_linkrev:
1495 break
1499 break
1496 # note: this loop will rarely go through multiple iterations, since
1500 # note: this loop will rarely go through multiple iterations, since
1497 # it only traverses commits created during the current streaming
1501 # it only traverses commits created during the current streaming
1498 # pull operation.
1502 # pull operation.
1499 #
1503 #
1500 # If this becomes a problem, using a binary search should cap the
1504 # If this becomes a problem, using a binary search should cap the
1501 # runtime of this.
1505 # runtime of this.
1502 n = n - 1
1506 n = n - 1
1503 if n == 0:
1507 if n == 0:
1504 # no data to send
1508 # no data to send
1505 return []
1509 return []
1506 index_size = n * index.entry_size
1510 index_size = n * index.entry_size
1507 data_size = self.end(n - 1)
1511 data_size = self.end(n - 1)
1508
1512
1509 # XXX we might have been split (or stripped) since the object
1513 # XXX we might have been split (or stripped) since the object
1510 # initialization. We need to close this race too, perhaps by having a
1514 # initialization. We need to close this race too, perhaps by having a
1511 # way to pre-open the files we feed to the revlog and never closing
1515 # way to pre-open the files we feed to the revlog and never closing
1512 # them before we are done streaming.
1516 # them before we are done streaming.
1513
1517
1514 if self._inline:
1518 if self._inline:
1515
1519
1516 def get_stream():
1520 def get_stream():
1517 with self.opener(self._indexfile, mode=b"r") as fp:
1521 with self.opener(self._indexfile, mode=b"r") as fp:
1518 yield None
1522 yield None
1519 size = index_size + data_size
1523 size = index_size + data_size
1520 if size <= 65536:
1524 if size <= 65536:
1521 yield fp.read(size)
1525 yield fp.read(size)
1522 else:
1526 else:
1523 yield from util.filechunkiter(fp, limit=size)
1527 yield from util.filechunkiter(fp, limit=size)
1524
1528
1525 inline_stream = get_stream()
1529 inline_stream = get_stream()
1526 next(inline_stream)
1530 next(inline_stream)
1527 return [
1531 return [
1528 (self._indexfile, inline_stream, index_size + data_size),
1532 (self._indexfile, inline_stream, index_size + data_size),
1529 ]
1533 ]
1530 elif force_inline:
1534 elif force_inline:
1531
1535
1532 def get_stream():
1536 def get_stream():
1533 with self.reading():
1537 with self.reading():
1534 yield None
1538 yield None
1535
1539
1536 for rev in range(n):
1540 for rev in range(n):
1537 idx = self.index.entry_binary(rev)
1541 idx = self.index.entry_binary(rev)
1538 if rev == 0 and self._docket is None:
1542 if rev == 0 and self._docket is None:
1539 # re-inject the inline flag
1543 # re-inject the inline flag
1540 header = self._format_flags
1544 header = self._format_flags
1541 header |= self._format_version
1545 header |= self._format_version
1542 header |= FLAG_INLINE_DATA
1546 header |= FLAG_INLINE_DATA
1543 header = self.index.pack_header(header)
1547 header = self.index.pack_header(header)
1544 idx = header + idx
1548 idx = header + idx
1545 yield idx
1549 yield idx
1546 yield self._inner.get_segment_for_revs(rev, rev)[1]
1550 yield self._inner.get_segment_for_revs(rev, rev)[1]
1547
1551
1548 inline_stream = get_stream()
1552 inline_stream = get_stream()
1549 next(inline_stream)
1553 next(inline_stream)
1550 return [
1554 return [
1551 (self._indexfile, inline_stream, index_size + data_size),
1555 (self._indexfile, inline_stream, index_size + data_size),
1552 ]
1556 ]
1553 else:
1557 else:
1554
1558
1555 def get_index_stream():
1559 def get_index_stream():
1556 with self.opener(self._indexfile, mode=b"r") as fp:
1560 with self.opener(self._indexfile, mode=b"r") as fp:
1557 yield None
1561 yield None
1558 if index_size <= 65536:
1562 if index_size <= 65536:
1559 yield fp.read(index_size)
1563 yield fp.read(index_size)
1560 else:
1564 else:
1561 yield from util.filechunkiter(fp, limit=index_size)
1565 yield from util.filechunkiter(fp, limit=index_size)
1562
1566
1563 def get_data_stream():
1567 def get_data_stream():
1564 with self._datafp() as fp:
1568 with self._datafp() as fp:
1565 yield None
1569 yield None
1566 if data_size <= 65536:
1570 if data_size <= 65536:
1567 yield fp.read(data_size)
1571 yield fp.read(data_size)
1568 else:
1572 else:
1569 yield from util.filechunkiter(fp, limit=data_size)
1573 yield from util.filechunkiter(fp, limit=data_size)
1570
1574
1571 index_stream = get_index_stream()
1575 index_stream = get_index_stream()
1572 next(index_stream)
1576 next(index_stream)
1573 data_stream = get_data_stream()
1577 data_stream = get_data_stream()
1574 next(data_stream)
1578 next(data_stream)
1575 return [
1579 return [
1576 (self._datafile, data_stream, data_size),
1580 (self._datafile, data_stream, data_size),
1577 (self._indexfile, index_stream, index_size),
1581 (self._indexfile, index_stream, index_size),
1578 ]
1582 ]
1579
1583
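The tip-trimming loop at the top of `get_streams` can be read as: walk back from the tip until the linkrev drops below the cap. A compact sketch over a plain list of linkrevs (hypothetical data standing in for column 4 of the real index entries):

def stream_upper_bound(linkrevs, max_linkrev):
    """Number of leading revisions whose linkrev is < max_linkrev."""
    n = len(linkrevs)
    while n > 0 and linkrevs[n - 1] >= max_linkrev:
        n -= 1
    return n

# revisions 0-2 predate the cut-off; 3 and 4 were added concurrently:
assert stream_upper_bound([0, 1, 2, 5, 9], 5) == 3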
1580 def _loadindex(self, docket=None):
1584 def _loadindex(self, docket=None):
1581
1585
1582 new_header, mmapindexthreshold, force_nodemap = self._init_opts()
1586 new_header, mmapindexthreshold, force_nodemap = self._init_opts()
1583
1587
1584 if self.postfix is not None:
1588 if self.postfix is not None:
1585 entry_point = b'%s.i.%s' % (self.radix, self.postfix)
1589 entry_point = b'%s.i.%s' % (self.radix, self.postfix)
1586 elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
1590 elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
1587 entry_point = b'%s.i.a' % self.radix
1591 entry_point = b'%s.i.a' % self.radix
1588 elif self._try_split and self.opener.exists(self._split_index_file):
1592 elif self._try_split and self.opener.exists(self._split_index_file):
1589 entry_point = self._split_index_file
1593 entry_point = self._split_index_file
1590 else:
1594 else:
1591 entry_point = b'%s.i' % self.radix
1595 entry_point = b'%s.i' % self.radix
1592
1596
1593 if docket is not None:
1597 if docket is not None:
1594 self._docket = docket
1598 self._docket = docket
1595 self._docket_file = entry_point
1599 self._docket_file = entry_point
1596 else:
1600 else:
1597 self._initempty = True
1601 self._initempty = True
1598 entry_data = self._get_data(entry_point, mmapindexthreshold)
1602 entry_data = self._get_data(entry_point, mmapindexthreshold)
1599 if len(entry_data) > 0:
1603 if len(entry_data) > 0:
1600 header = INDEX_HEADER.unpack(entry_data[:4])[0]
1604 header = INDEX_HEADER.unpack(entry_data[:4])[0]
1601 self._initempty = False
1605 self._initempty = False
1602 else:
1606 else:
1603 header = new_header
1607 header = new_header
1604
1608
1605 self._format_flags = header & ~0xFFFF
1609 self._format_flags = header & ~0xFFFF
1606 self._format_version = header & 0xFFFF
1610 self._format_version = header & 0xFFFF
1607
1611
1608 supported_flags = SUPPORTED_FLAGS.get(self._format_version)
1612 supported_flags = SUPPORTED_FLAGS.get(self._format_version)
1609 if supported_flags is None:
1613 if supported_flags is None:
1610 msg = _(b'unknown version (%d) in revlog %s')
1614 msg = _(b'unknown version (%d) in revlog %s')
1611 msg %= (self._format_version, self.display_id)
1615 msg %= (self._format_version, self.display_id)
1612 raise error.RevlogError(msg)
1616 raise error.RevlogError(msg)
1613 elif self._format_flags & ~supported_flags:
1617 elif self._format_flags & ~supported_flags:
1614 msg = _(b'unknown flags (%#04x) in version %d revlog %s')
1618 msg = _(b'unknown flags (%#04x) in version %d revlog %s')
1615 display_flag = self._format_flags >> 16
1619 display_flag = self._format_flags >> 16
1616 msg %= (display_flag, self._format_version, self.display_id)
1620 msg %= (display_flag, self._format_version, self.display_id)
1617 raise error.RevlogError(msg)
1621 raise error.RevlogError(msg)
1618
1622
1619 features = FEATURES_BY_VERSION[self._format_version]
1623 features = FEATURES_BY_VERSION[self._format_version]
1620 self._inline = features[b'inline'](self._format_flags)
1624 self._inline = features[b'inline'](self._format_flags)
1621 self.delta_config.general_delta = features[b'generaldelta'](
1625 self.delta_config.general_delta = features[b'generaldelta'](
1622 self._format_flags
1626 self._format_flags
1623 )
1627 )
1624 self.feature_config.has_side_data = features[b'sidedata']
1628 self.feature_config.has_side_data = features[b'sidedata']
1625
1629
1626 if not features[b'docket']:
1630 if not features[b'docket']:
1627 self._indexfile = entry_point
1631 self._indexfile = entry_point
1628 index_data = entry_data
1632 index_data = entry_data
1629 else:
1633 else:
1630 self._docket_file = entry_point
1634 self._docket_file = entry_point
1631 if self._initempty:
1635 if self._initempty:
1632 self._docket = docketutil.default_docket(self, header)
1636 self._docket = docketutil.default_docket(self, header)
1633 else:
1637 else:
1634 self._docket = docketutil.parse_docket(
1638 self._docket = docketutil.parse_docket(
1635 self, entry_data, use_pending=self._trypending
1639 self, entry_data, use_pending=self._trypending
1636 )
1640 )
1637
1641
1638 if self._docket is not None:
1642 if self._docket is not None:
1639 self._indexfile = self._docket.index_filepath()
1643 self._indexfile = self._docket.index_filepath()
1640 index_data = b''
1644 index_data = b''
1641 index_size = self._docket.index_end
1645 index_size = self._docket.index_end
1642 if index_size > 0:
1646 if index_size > 0:
1643 index_data = self._get_data(
1647 index_data = self._get_data(
1644 self._indexfile, mmapindexthreshold, size=index_size
1648 self._indexfile, mmapindexthreshold, size=index_size
1645 )
1649 )
1646 if len(index_data) < index_size:
1650 if len(index_data) < index_size:
1647 msg = _(b'too few index data for %s: got %d, expected %d')
1651 msg = _(b'too few index data for %s: got %d, expected %d')
1648 msg %= (self.display_id, len(index_data), index_size)
1652 msg %= (self.display_id, len(index_data), index_size)
1649 raise error.RevlogError(msg)
1653 raise error.RevlogError(msg)
1650
1654
1651 self._inline = False
1655 self._inline = False
1652 # generaldelta implied by version 2 revlogs.
1656 # generaldelta implied by version 2 revlogs.
1653 self.delta_config.general_delta = True
1657 self.delta_config.general_delta = True
1654 # the logic for persistent nodemap will be dealt with within the
1658 # the logic for persistent nodemap will be dealt with within the
1655 # main docket, so disable it for now.
1659 # main docket, so disable it for now.
1656 self._nodemap_file = None
1660 self._nodemap_file = None
1657
1661
1658 if self._docket is not None:
1662 if self._docket is not None:
1659 self._datafile = self._docket.data_filepath()
1663 self._datafile = self._docket.data_filepath()
1660 self._sidedatafile = self._docket.sidedata_filepath()
1664 self._sidedatafile = self._docket.sidedata_filepath()
1661 elif self.postfix is None:
1665 elif self.postfix is None:
1662 self._datafile = b'%s.d' % self.radix
1666 self._datafile = b'%s.d' % self.radix
1663 else:
1667 else:
1664 self._datafile = b'%s.d.%s' % (self.radix, self.postfix)
1668 self._datafile = b'%s.d.%s' % (self.radix, self.postfix)
1665
1669
1666 self.nodeconstants = sha1nodeconstants
1670 self.nodeconstants = sha1nodeconstants
1667 self.nullid = self.nodeconstants.nullid
1671 self.nullid = self.nodeconstants.nullid
1668
1672
1669 # sparse-revlog can't be on without general-delta (issue6056)
1673 # sparse-revlog can't be on without general-delta (issue6056)
1670 if not self.delta_config.general_delta:
1674 if not self.delta_config.general_delta:
1671 self.delta_config.sparse_revlog = False
1675 self.delta_config.sparse_revlog = False
1672
1676
1673 self._storedeltachains = True
1677 self._storedeltachains = True
1674
1678
1675 devel_nodemap = (
1679 devel_nodemap = (
1676 self._nodemap_file
1680 self._nodemap_file
1677 and force_nodemap
1681 and force_nodemap
1678 and parse_index_v1_nodemap is not None
1682 and parse_index_v1_nodemap is not None
1679 )
1683 )
1680
1684
1681 use_rust_index = False
1685 use_rust_index = False
1682 if rustrevlog is not None:
1686 if rustrevlog is not None:
1683 if self._nodemap_file is not None:
1687 if self._nodemap_file is not None:
1684 use_rust_index = True
1688 use_rust_index = True
1685 else:
1689 else:
1686 use_rust_index = self.opener.options.get(b'rust.index')
1690 use_rust_index = self.opener.options.get(b'rust.index')
1687
1691
1688 self._parse_index = parse_index_v1
1692 self._parse_index = parse_index_v1
1689 if self._format_version == REVLOGV0:
1693 if self._format_version == REVLOGV0:
1690 self._parse_index = revlogv0.parse_index_v0
1694 self._parse_index = revlogv0.parse_index_v0
1691 elif self._format_version == REVLOGV2:
1695 elif self._format_version == REVLOGV2:
1692 self._parse_index = parse_index_v2
1696 self._parse_index = parse_index_v2
1693 elif self._format_version == CHANGELOGV2:
1697 elif self._format_version == CHANGELOGV2:
1694 self._parse_index = parse_index_cl_v2
1698 self._parse_index = parse_index_cl_v2
1695 elif devel_nodemap:
1699 elif devel_nodemap:
1696 self._parse_index = parse_index_v1_nodemap
1700 self._parse_index = parse_index_v1_nodemap
1697 elif use_rust_index:
1701 elif use_rust_index:
1698 self._parse_index = parse_index_v1_mixed
1702 self._parse_index = parse_index_v1_mixed
1699 try:
1703 try:
1700 d = self._parse_index(index_data, self._inline)
1704 d = self._parse_index(index_data, self._inline)
1701 index, chunkcache = d
1705 index, chunkcache = d
1702 use_nodemap = (
1706 use_nodemap = (
1703 not self._inline
1707 not self._inline
1704 and self._nodemap_file is not None
1708 and self._nodemap_file is not None
1705 and hasattr(index, 'update_nodemap_data')
1709 and hasattr(index, 'update_nodemap_data')
1706 )
1710 )
1707 if use_nodemap:
1711 if use_nodemap:
1708 nodemap_data = nodemaputil.persisted_data(self)
1712 nodemap_data = nodemaputil.persisted_data(self)
1709 if nodemap_data is not None:
1713 if nodemap_data is not None:
1710 docket = nodemap_data[0]
1714 docket = nodemap_data[0]
1711 if (
1715 if (
1712 len(d[0]) > docket.tip_rev
1716 len(d[0]) > docket.tip_rev
1713 and d[0][docket.tip_rev][7] == docket.tip_node
1717 and d[0][docket.tip_rev][7] == docket.tip_node
1714 ):
1718 ):
1715 # no changelog tampering
1719 # no changelog tampering
1716 self._nodemap_docket = docket
1720 self._nodemap_docket = docket
1717 index.update_nodemap_data(*nodemap_data)
1721 index.update_nodemap_data(*nodemap_data)
1718 except (ValueError, IndexError):
1722 except (ValueError, IndexError):
1719 raise error.RevlogError(
1723 raise error.RevlogError(
1720 _(b"index %s is corrupted") % self.display_id
1724 _(b"index %s is corrupted") % self.display_id
1721 )
1725 )
1722 self.index = index
1726 self.index = index
1723 # revnum -> (chain-length, sum-delta-length)
1727 # revnum -> (chain-length, sum-delta-length)
1724 self._chaininfocache = util.lrucachedict(500)
1728 self._chaininfocache = util.lrucachedict(500)
1725
1729
1726 return chunkcache
1730 return chunkcache
1727
1731
1728 def _load_inner(self, chunk_cache):
1732 def _load_inner(self, chunk_cache):
1729 if self._docket is None:
1733 if self._docket is None:
1730 default_compression_header = None
1734 default_compression_header = None
1731 else:
1735 else:
1732 default_compression_header = self._docket.default_compression_header
1736 default_compression_header = self._docket.default_compression_header
1733
1737
1734 self._inner = _InnerRevlog(
1738 self._inner = _InnerRevlog(
1735 opener=self.opener,
1739 opener=self.opener,
1736 index=self.index,
1740 index=self.index,
1737 index_file=self._indexfile,
1741 index_file=self._indexfile,
1738 data_file=self._datafile,
1742 data_file=self._datafile,
1739 sidedata_file=self._sidedatafile,
1743 sidedata_file=self._sidedatafile,
1740 inline=self._inline,
1744 inline=self._inline,
1741 data_config=self.data_config,
1745 data_config=self.data_config,
1742 delta_config=self.delta_config,
1746 delta_config=self.delta_config,
1743 feature_config=self.feature_config,
1747 feature_config=self.feature_config,
1744 chunk_cache=chunk_cache,
1748 chunk_cache=chunk_cache,
1745 default_compression_header=default_compression_header,
1749 default_compression_header=default_compression_header,
1746 )
1750 )
1747
1751
1748 def get_revlog(self):
1752 def get_revlog(self):
1749 """simple function to mirror API of other not-really-revlog API"""
1753 """simple function to mirror API of other not-really-revlog API"""
1750 return self
1754 return self
1751
1755
1752 @util.propertycache
1756 @util.propertycache
1753 def revlog_kind(self):
1757 def revlog_kind(self):
1754 return self.target[0]
1758 return self.target[0]
1755
1759
1756 @util.propertycache
1760 @util.propertycache
1757 def display_id(self):
1761 def display_id(self):
1758 """The public facing "ID" of the revlog that we use in message"""
1762 """The public facing "ID" of the revlog that we use in message"""
1759 if self.revlog_kind == KIND_FILELOG:
1763 if self.revlog_kind == KIND_FILELOG:
1760 # Reference the file without the "data/" prefix, so it is familiar
1764 # Reference the file without the "data/" prefix, so it is familiar
1761 # to the user.
1765 # to the user.
1762 return self.target[1]
1766 return self.target[1]
1763 else:
1767 else:
1764 return self.radix
1768 return self.radix
1765
1769
1766 def _datafp(self, mode=b'r'):
1770 def _datafp(self, mode=b'r'):
1767 """file object for the revlog's data file"""
1771 """file object for the revlog's data file"""
1768 return self.opener(self._datafile, mode=mode)
1772 return self.opener(self._datafile, mode=mode)
1769
1773
1770 def tiprev(self):
1774 def tiprev(self):
1771 return len(self.index) - 1
1775 return len(self.index) - 1
1772
1776
1773 def tip(self):
1777 def tip(self):
1774 return self.node(self.tiprev())
1778 return self.node(self.tiprev())
1775
1779
1776 def __contains__(self, rev):
1780 def __contains__(self, rev):
1777 return 0 <= rev < len(self)
1781 return 0 <= rev < len(self)
1778
1782
1779 def __len__(self):
1783 def __len__(self):
1780 return len(self.index)
1784 return len(self.index)
1781
1785
1782 def __iter__(self):
1786 def __iter__(self):
1783 return iter(range(len(self)))
1787 return iter(range(len(self)))
1784
1788
1785 def revs(self, start=0, stop=None):
1789 def revs(self, start=0, stop=None):
1786 """iterate over all rev in this revlog (from start to stop)"""
1790 """iterate over all rev in this revlog (from start to stop)"""
1787 return storageutil.iterrevs(len(self), start=start, stop=stop)
1791 return storageutil.iterrevs(len(self), start=start, stop=stop)
1788
1792
1789 def hasnode(self, node):
1793 def hasnode(self, node):
1790 try:
1794 try:
1791 self.rev(node)
1795 self.rev(node)
1792 return True
1796 return True
1793 except KeyError:
1797 except KeyError:
1794 return False
1798 return False
1795
1799
1796 def _candelta(self, baserev, rev):
1800 def _candelta(self, baserev, rev):
1797 """whether two revisions (baserev, rev) can be delta-ed or not"""
1801 """whether two revisions (baserev, rev) can be delta-ed or not"""
1798 # Disable delta if either rev requires a content-changing flag
1802 # Disable delta if either rev requires a content-changing flag
1799 # processor (ex. LFS). This is because such a flag processor can alter
1803 # processor (ex. LFS). This is because such a flag processor can alter
1800 # the rawtext content that the delta will be based on, and two clients
1804 # the rawtext content that the delta will be based on, and two clients
1801 # could have the same revlog node with different flags (i.e. different
1805 # could have the same revlog node with different flags (i.e. different
1802 # rawtext contents) and the delta could be incompatible.
1806 # rawtext contents) and the delta could be incompatible.
1803 if (self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS) or (
1807 if (self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS) or (
1804 self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS
1808 self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS
1805 ):
1809 ):
1806 return False
1810 return False
1807 return True
1811 return True
1808
1812
1809 def update_caches(self, transaction):
1813 def update_caches(self, transaction):
1810 """update on disk cache
1814 """update on disk cache
1811
1815
1812 If a transaction is passed, the update may be delayed to transaction
1816 If a transaction is passed, the update may be delayed to transaction
1813 commit."""
1817 commit."""
1814 if self._nodemap_file is not None:
1818 if self._nodemap_file is not None:
1815 if transaction is None:
1819 if transaction is None:
1816 nodemaputil.update_persistent_nodemap(self)
1820 nodemaputil.update_persistent_nodemap(self)
1817 else:
1821 else:
1818 nodemaputil.setup_persistent_nodemap(transaction, self)
1822 nodemaputil.setup_persistent_nodemap(transaction, self)
1819
1823
1820 def clearcaches(self):
1824 def clearcaches(self):
1821 """Clear in-memory caches"""
1825 """Clear in-memory caches"""
1822 self._chainbasecache.clear()
1826 self._chainbasecache.clear()
1823 self._inner.clear_cache()
1827 self._inner.clear_cache()
1824 self._pcache = {}
1828 self._pcache = {}
1825 self._nodemap_docket = None
1829 self._nodemap_docket = None
1826 self.index.clearcaches()
1830 self.index.clearcaches()
1827 # The python code is the one responsible for validating the docket, so we
1831 # The python code is the one responsible for validating the docket, so we
1828 # end up having to refresh it here.
1832 # end up having to refresh it here.
1829 use_nodemap = (
1833 use_nodemap = (
1830 not self._inline
1834 not self._inline
1831 and self._nodemap_file is not None
1835 and self._nodemap_file is not None
1832 and hasattr(self.index, 'update_nodemap_data')
1836 and hasattr(self.index, 'update_nodemap_data')
1833 )
1837 )
1834 if use_nodemap:
1838 if use_nodemap:
1835 nodemap_data = nodemaputil.persisted_data(self)
1839 nodemap_data = nodemaputil.persisted_data(self)
1836 if nodemap_data is not None:
1840 if nodemap_data is not None:
1837 self._nodemap_docket = nodemap_data[0]
1841 self._nodemap_docket = nodemap_data[0]
1838 self.index.update_nodemap_data(*nodemap_data)
1842 self.index.update_nodemap_data(*nodemap_data)
1839
1843
1840 def rev(self, node):
1844 def rev(self, node):
1841 """return the revision number associated with a <nodeid>"""
1845 """return the revision number associated with a <nodeid>"""
1842 try:
1846 try:
1843 return self.index.rev(node)
1847 return self.index.rev(node)
1844 except TypeError:
1848 except TypeError:
1845 raise
1849 raise
1846 except error.RevlogError:
1850 except error.RevlogError:
1847 # parsers.c radix tree lookup failed
1851 # parsers.c radix tree lookup failed
1848 if (
1852 if (
1849 node == self.nodeconstants.wdirid
1853 node == self.nodeconstants.wdirid
1850 or node in self.nodeconstants.wdirfilenodeids
1854 or node in self.nodeconstants.wdirfilenodeids
1851 ):
1855 ):
1852 raise error.WdirUnsupported
1856 raise error.WdirUnsupported
1853 raise error.LookupError(node, self.display_id, _(b'no node'))
1857 raise error.LookupError(node, self.display_id, _(b'no node'))
1854
1858
    # Accessors for index entries.

    # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
    # are flags.
    def start(self, rev):
        return int(self.index[rev][0] >> 16)

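    # Illustration of the packing above, with a hypothetical value: for an
    # entry whose first field is 0x00A40001, start() yields the offset
    # 0x00A40001 >> 16 == 0xA4 while flags() yields 0x00A40001 & 0xFFFF == 1.
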
    def sidedata_cut_off(self, rev):
        sd_cut_off = self.index[rev][8]
        if sd_cut_off != 0:
            return sd_cut_off
        # This is some annoying dance, because entries without sidedata
        # currently use 0 as their offset. (instead of previous-offset +
        # previous-size)
        #
        # We should reconsider this sidedata → 0 sidedata_offset policy.
        # In the meantime, we need this.
        while 0 <= rev:
            e = self.index[rev]
            if e[9] != 0:
                return e[8] + e[9]
            rev -= 1
        return 0

    def flags(self, rev):
        return self.index[rev][0] & 0xFFFF

    def length(self, rev):
        return self.index[rev][1]

    def sidedata_length(self, rev):
        if not self.feature_config.has_side_data:
            return 0
        return self.index[rev][9]

    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.rawdata(rev)
        return len(t)

    def size(self, rev):
        """length of non-raw text (processed by a "read" flag processor)"""
        # fast path: if no "read" flag processor could change the content,
        # size is rawsize. note: ELLIPSIS is known to not change the content.
        flags = self.flags(rev)
        if flags & (flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
            return self.rawsize(rev)

        return len(self.revision(rev))

    def fast_rank(self, rev):
        """Return the rank of a revision if already known, or None otherwise.

        The rank of a revision is the size of the sub-graph it defines as a
        head. Equivalently, the rank of a revision `r` is the size of the set
        `ancestors(r)`, `r` included.

        This method returns the rank retrieved from the revlog in constant
        time. It makes no attempt at computing unknown values for versions of
        the revlog which do not persist the rank.
        """
        rank = self.index[rev][ENTRY_RANK]
        if self._format_version != CHANGELOGV2 or rank == RANK_UNKNOWN:
            return None
        if rev == nullrev:
            return 0  # convention
        return rank

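    # For instance, in a linear history 0 <- 1 <- 2 the rank of revision 2
    # is 3, since `ancestors(2)` contains revisions 0, 1 and 2, assuming a
    # changelog-v2 revlog that persists ranks.
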
    def chainbase(self, rev):
        base = self._chainbasecache.get(rev)
        if base is not None:
            return base

        index = self.index
        iterrev = rev
        base = index[iterrev][3]
        while base != iterrev:
            iterrev = base
            base = index[iterrev][3]

        self._chainbasecache[rev] = base
        return base

    def linkrev(self, rev):
        return self.index[rev][4]

    def parentrevs(self, rev):
        try:
            entry = self.index[rev]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise

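        # When parents are reported in canonical order, a stored null first
        # parent is swapped with the second one, so e.g. a stored pair
        # (nullrev, 5) is returned as (5, nullrev).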
        if self.feature_config.canonical_parent_order and entry[5] == nullrev:
            return entry[6], entry[5]
        else:
            return entry[5], entry[6]

    # fast parentrevs(rev) where rev isn't filtered
    _uncheckedparentrevs = parentrevs

    def node(self, rev):
        try:
            return self.index[rev][7]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise

    # Derived from index values.

    def end(self, rev):
        return self.start(rev) + self.length(rev)

    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        # inline node() to avoid function call overhead
        if self.feature_config.canonical_parent_order and d[5] == self.nullid:
            return i[d[6]][7], i[d[5]][7]
        else:
            return i[d[5]][7], i[d[6]][7]

    def chainlen(self, rev):
        return self._chaininfo(rev)[0]

    def _chaininfo(self, rev):
        chaininfocache = self._chaininfocache
        if rev in chaininfocache:
            return chaininfocache[rev]
        index = self.index
        generaldelta = self.delta_config.general_delta
        iterrev = rev
        e = index[iterrev]
        clen = 0
        compresseddeltalen = 0
        while iterrev != e[3]:
            clen += 1
            compresseddeltalen += e[1]
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            if iterrev in chaininfocache:
                t = chaininfocache[iterrev]
                clen += t[0]
                compresseddeltalen += t[1]
                break
            e = index[iterrev]
        else:
            # Add text length of base since decompressing that also takes
            # work. For cache hits the length is already included.
            compresseddeltalen += e[1]
        r = (clen, compresseddeltalen)
        chaininfocache[rev] = r
        return r

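    # Note: _chaininfo() returns (chain length, cumulative compressed size
    # of the chain, base included); a revision stored as a full snapshot
    # has a chain length of 0 under this counting.
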
    def _deltachain(self, rev, stoprev=None):
        return self._inner._deltachain(rev, stoprev=stoprev)

    def ancestors(self, revs, stoprev=0, inclusive=False):
        """Generate the ancestors of 'revs' in reverse revision order.
        Does not generate revs lower than stoprev.

        See the documentation for ancestor.lazyancestors for more details."""

        # first, make sure start revisions aren't filtered
        revs = list(revs)
        checkrev = self.node
        for r in revs:
            checkrev(r)
        # and we're sure ancestors aren't filtered as well

        if rustancestor is not None and self.index.rust_ext_compat:
            lazyancestors = rustancestor.LazyAncestors
            arg = self.index
        else:
            lazyancestors = ancestor.lazyancestors
            arg = self._uncheckedparentrevs
        return lazyancestors(arg, revs, stoprev=stoprev, inclusive=inclusive)

    def descendants(self, revs):
        return dagop.descendantrevs(revs, self.revs, self.parentrevs)

    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common. In revset terminology, we return the
        tuple:

          ::common, (::heads) - (::common)

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [self.nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        class lazyset:
            def __init__(self, lazyvalues):
                self.addedvalues = set()
                self.lazyvalues = lazyvalues

            def __contains__(self, value):
                return value in self.addedvalues or value in self.lazyvalues

            def __iter__(self):
                added = self.addedvalues
                for r in added:
                    yield r
                for r in self.lazyvalues:
                    if r not in added:
                        yield r

            def add(self, value):
                self.addedvalues.add(value)

            def update(self, values):
                self.addedvalues.update(values)

        has = lazyset(self.ancestors(common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = collections.deque(r for r in heads if r not in has)
        while visit:
            r = visit.popleft()
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(miss) for miss in missing]

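    # Sketch of the contract above, assuming a hypothetical linear history
    # 0..4: findcommonmissing([node(2)]) returns a lazy set covering `::2`
    # plus nullrev, together with the missing list [node(3), node(4)].
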
    def incrementalmissingrevs(self, common=None):
        """Return an object that can be used to incrementally compute the
        revision numbers of the ancestors of arbitrary sets that are not
        ancestors of common. This is an ancestor.incrementalmissingancestors
        object.

        'common' is a list of revision numbers. If common is not supplied, uses
        nullrev.
        """
        if common is None:
            common = [nullrev]

        if rustancestor is not None and self.index.rust_ext_compat:
            return rustancestor.MissingAncestors(self.index, common)
        return ancestor.incrementalmissingancestors(self.parentrevs, common)

    def findmissingrevs(self, common=None, heads=None):
        """Return the revision numbers of the ancestors of heads that
        are not ancestors of common.

        More specifically, return a list of revision numbers corresponding to
        nodes N such that every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of revision numbers. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullrev]
        if heads is None:
            heads = self.headrevs()

        inc = self.incrementalmissingrevs(common=common)
        return inc.missingancestors(heads)

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [self.nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        inc = self.incrementalmissingrevs(common=common)
        return [self.node(r) for r in inc.missingancestors(heads)]

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [self.nullid]  # Everybody's a descendant of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return (
                [self.node(r) for r in self],
                [self.nullid],
                list(self.heads()),
            )
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == self.nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendant of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n)  # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update(
                            [p for p in self.parents(n) if p != self.nullid]
                        )
                    elif n in heads:  # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [root for root in roots if root in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(root) for root in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [self.nullid]
        # Transform our roots list into a set.
        descendants = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendants.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendants, empty parents will look like
        # they're descendants.
        for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
            n = self.node(r)
            isdescendant = False
            if lowestrev == nullrev:  # Everybody is a descendant of nullid
                isdescendant = True
            elif n in descendants:
                # n is already a descendant
                isdescendant = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendants before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendants, it's not a root.
                    if (p[0] in descendants) or (p[1] in descendants):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendant if either of its parents are
                # descendants. (We seeded the descendants set with the roots
                # up there, remember?)
                if (p[0] in descendants) or (p[1] in descendants):
                    descendants.add(n)
                    isdescendant = True
            if isdescendant and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendants and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [head for head, flag in heads.items() if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

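    # For example, with a hypothetical linear history 0..4,
    # nodesbetween([node(1)], [node(3)]) would return
    # ([node(1), node(2), node(3)], [node(1)], [node(3)]).
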
    def headrevs(self, revs=None):
        if revs is None:
            try:
                return self.index.headrevs()
            except AttributeError:
                return self._headrevs()
        if rustdagop is not None and self.index.rust_ext_compat:
            return rustdagop.headrevs(self.index, revs)
        return dagop.headrevs(revs, self._uncheckedparentrevs)

    def computephases(self, roots):
        return self.index.computephasesmapsets(roots)

    def _headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        # we won't iterate over filtered revs, so nobody is a head at start
        ishead = [0] * (count + 1)
        index = self.index
        for r in self:
            ishead[r] = 1  # I may be a head
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0  # my parents are not
        return [r for r, val in enumerate(ishead) if val]

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [self.nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullrev
        else:
            start = self.rev(start)

        stoprevs = {self.rev(n) for n in stop or []}

        revs = dagop.headrevssubset(
            self.revs, self.parentrevs, startrev=start, stoprevs=stoprevs
        )

        return [self.node(rev) for rev in revs]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in self.revs(start=p + 1):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
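            # a revision with no non-null parent is a child of nullrev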
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def commonancestorsheads(self, a, b):
        """calculate all the heads of the common ancestors of nodes a and b"""
        a, b = self.rev(a), self.rev(b)
        ancs = self._commonancestorsheads(a, b)
        return pycompat.maplist(self.node, ancs)

    def _commonancestorsheads(self, *revs):
        """calculate all the heads of the common ancestors of revs"""
        try:
            ancs = self.index.commonancestorsheads(*revs)
        except (AttributeError, OverflowError):  # C implementation failed
            ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
        return ancs

    def isancestor(self, a, b):
        """return True if node a is an ancestor of node b

        A revision is considered an ancestor of itself."""
        a, b = self.rev(a), self.rev(b)
        return self.isancestorrev(a, b)

    def isancestorrev(self, a, b):
        """return True if revision a is an ancestor of revision b

        A revision is considered an ancestor of itself.

        The implementation of this is trivial but the use of
        reachableroots is not."""
        if a == nullrev:
            return True
        elif a == b:
            return True
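        # revision numbers are topologically sorted, so an ancestor never
        # has a larger revision number than its descendant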
        elif a > b:
            return False
        return bool(self.reachableroots(a, [b], [a], includepath=False))

    def reachableroots(self, minroot, heads, roots, includepath=False):
        """return (heads(::(<roots> and <roots>::<heads>)))

        If includepath is True, return (<roots>::<heads>)."""
        try:
            return self.index.reachableroots2(
                minroot, heads, roots, includepath
            )
        except AttributeError:
            return dagop._reachablerootspure(
                self.parentrevs, minroot, roots, heads, includepath
            )

    def ancestor(self, a, b):
        """calculate the "best" common ancestor of nodes a and b"""

        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.ancestors(a, b)
        except (AttributeError, OverflowError):
            ancs = ancestor.ancestors(self.parentrevs, a, b)
        if ancs:
            # choose a consistent winner when there's a tie
            return min(map(self.node, ancs))
        return self.nullid

    def _match(self, id):
        if isinstance(id, int):
            # rev
            return self.node(id)
        if len(id) == self.nodeconstants.nodelen:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node)  # quick search the index
                return node
            except error.LookupError:
                pass  # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if b"%d" % rev != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 2 * self.nodeconstants.nodelen:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (binascii.Error, error.LookupError):
                pass

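    # _match() tries, in order: integer revision, binary node of the right
    # length, str(rev), and finally a full hex nodeid; when nothing matches
    # it implicitly returns None and lookup() falls back to _partialmatch().
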
    def _partialmatch(self, id):
        # we don't care about wdirfilenodeids as they should always be full
        # hashes
        maybewdir = self.nodeconstants.wdirhex.startswith(id)
        ambiguous = False
        try:
            partial = self.index.partialmatch(id)
            if partial and self.hasnode(partial):
                if maybewdir:
                    # single 'ff...' match in radix tree, ambiguous with wdir
                    ambiguous = True
                else:
                    return partial
            elif maybewdir:
                # no 'ff...' match in radix tree, wdir identified
                raise error.WdirUnsupported
            else:
                return None
        except error.RevlogError:
            # parsers.c radix tree lookup gave multiple matches
            # fast path: for unfiltered changelog, radix tree is accurate
            if not getattr(self, 'filteredrevs', None):
                ambiguous = True
            # fall through to slow path that filters hidden revisions
        except (AttributeError, ValueError):
            # we are pure python, or key is not hex
            pass
        if ambiguous:
            raise error.AmbiguousPrefixLookupError(
                id, self.display_id, _(b'ambiguous identifier')
            )

        if id in self._pcache:
            return self._pcache[id]

        if len(id) <= 40:
            # hex(node)[:...]
            l = len(id) // 2 * 2  # grab an even number of digits
            try:
                # we're dropping the last digit, so let's check that it's hex,
                # to avoid the expensive computation below if it's not
                if len(id) % 2 > 0:
                    if not (id[-1] in hexdigits):
                        return None
                prefix = bin(id[:l])
            except binascii.Error:
                pass
            else:
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [
                    n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                ]
                if self.nodeconstants.nullhex.startswith(id):
                    nl.append(self.nullid)
                if len(nl) > 0:
                    if len(nl) == 1 and not maybewdir:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise error.AmbiguousPrefixLookupError(
                        id, self.display_id, _(b'ambiguous identifier')
                    )
                if maybewdir:
                    raise error.WdirUnsupported
                return None

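    # A prefix such as b'ff' is doubly delicate: it can match a real node in
    # the radix tree and also the virtual working-directory id (all 'f's),
    # which is why maybewdir is tracked throughout _partialmatch().
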
    def lookup(self, id):
        """locate a node based on:
        - revision number or str(revision number)
        - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise error.LookupError(id, self.display_id, _(b'no match found'))

    def shortest(self, node, minlength=1):
        """Find the shortest unambiguous prefix that matches node."""

        def isvalid(prefix):
            try:
                matchednode = self._partialmatch(prefix)
            except error.AmbiguousPrefixLookupError:
                return False
            except error.WdirUnsupported:
                # single 'ff...' match
                return True
            if matchednode is None:
                raise error.LookupError(node, self.display_id, _(b'no node'))
            return True

        def maybewdir(prefix):
            return all(c == b'f' for c in pycompat.iterbytestr(prefix))

        hexnode = hex(node)

        def disambiguate(hexnode, minlength):
            """Disambiguate against wdirid."""
            for length in range(minlength, len(hexnode) + 1):
                prefix = hexnode[:length]
                if not maybewdir(prefix):
                    return prefix

        if not getattr(self, 'filteredrevs', None):
            try:
                length = max(self.index.shortest(node), minlength)
                return disambiguate(hexnode, length)
            except error.RevlogError:
                if node != self.nodeconstants.wdirid:
                    raise error.LookupError(
                        node, self.display_id, _(b'no node')
                    )
            except AttributeError:
                # Fall through to pure code
                pass

        if node == self.nodeconstants.wdirid:
            for length in range(minlength, len(hexnode) + 1):
                prefix = hexnode[:length]
                if isvalid(prefix):
                    return prefix

        for length in range(minlength, len(hexnode) + 1):
            prefix = hexnode[:length]
            if isvalid(prefix):
                return disambiguate(hexnode, length)

    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different from what is stored.
        """
        p1, p2 = self.parents(node)
        return storageutil.hashrevisionsha1(text, p1, p2) != node

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self.delta_config.general_delta:
            return base
        else:
            return rev - 1

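    # With general delta, the delta parent is whatever base the index
    # recorded; without it, a revision is always a delta against its
    # immediate predecessor (rev - 1). A base equal to rev itself marks a
    # full text, reported as a null delta parent.
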
    def issnapshot(self, rev):
        """tells whether rev is a snapshot"""
        ret = self._inner.issnapshot(rev)
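        # cache the bound inner method on the instance so later calls skip
        # this wrapper entirely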
        self.issnapshot = self._inner.issnapshot
        return ret

    def snapshotdepth(self, rev):
        """number of snapshots in the chain before this one"""
        if not self.issnapshot(rev):
            raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
        return len(self._inner._deltachain(rev)[0]) - 1

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions

        The delta calculated is in binary form and is intended to be written to
        revlog data directly. So this function needs raw revision data.
        """
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return bytes(self._inner._chunk(rev2))

        return mdiff.textdiff(self.rawdata(rev1), self.rawdata(rev2))

    def revision(self, nodeorrev):
        """return an uncompressed revision of a given node or revision
        number.
        """
        return self._revisiondata(nodeorrev)

    def sidedata(self, nodeorrev):
        """a map of extra data related to the changeset but not part of the hash

        This function currently returns a dictionary. However, a more advanced
        mapping object will likely be used in the future for more
        efficient/lazy code.
        """
        # deal with <nodeorrev> argument type
        if isinstance(nodeorrev, int):
            rev = nodeorrev
        else:
            rev = self.rev(nodeorrev)
        return self._sidedata(rev)

    def _rawtext(self, node, rev):
        """return the possibly unvalidated rawtext for a revision

        returns (rev, rawtext, validated)
        """
        # Check if we have the entry in cache
        # The cache entry looks like (node, rev, rawtext)
        if self._inner._revisioncache:
            if self._inner._revisioncache[0] == node:
                return (rev, self._inner._revisioncache[2], True)

        if rev is None:
            rev = self.rev(node)

        return self._inner.raw_text(node, rev)

    def _revisiondata(self, nodeorrev, raw=False):
        # deal with <nodeorrev> argument type
        if isinstance(nodeorrev, int):
            rev = nodeorrev
            node = self.node(rev)
        else:
            node = nodeorrev
            rev = None

        # fast path the special `nullid` rev
        if node == self.nullid:
            return b""

        # ``rawtext`` is the text as stored inside the revlog. Might be the
        # revision or might need to be processed to retrieve the revision.
        rev, rawtext, validated = self._rawtext(node, rev)

        if raw and validated:
            # if we don't want to process the raw text and the raw
            # text is cached, we can exit early.
            return rawtext
        if rev is None:
            rev = self.rev(node)
        # the revlog's flags for this revision
        # (these usually alter its state or content)
        flags = self.flags(rev)

        if validated and flags == REVIDX_DEFAULT_FLAGS:
            # no extra flags set, no flag processor runs, text = rawtext
            return rawtext

        if raw:
            validatehash = flagutil.processflagsraw(self, rawtext, flags)
            text = rawtext
        else:
            r = flagutil.processflagsread(self, rawtext, flags)
            text, validatehash = r
        if validatehash:
            self.checkhash(text, node, rev=rev)
        if not validated:
            self._inner._revisioncache = (node, rev, rawtext)

        return text

    def _sidedata(self, rev):
        """Return the sidedata for a given revision number."""
        sidedata_end = None
        if self._docket is not None:
            sidedata_end = self._docket.sidedata_end
        return self._inner.sidedata(rev, sidedata_end)

    def rawdata(self, nodeorrev):
        """return the uncompressed raw data of a given node or revision number."""
        return self._revisiondata(nodeorrev, raw=True)

    def hash(self, text, p1, p2):
        """Compute a node hash.

        Available as a function so that subclasses can replace the hash
        as needed.
        """
        return storageutil.hashrevisionsha1(text, p1, p2)

    def checkhash(self, text, node, p1=None, p2=None, rev=None):
        """Check node hash integrity.

        Available as a function so that subclasses can extend hash mismatch
        behaviors as needed.
        """
        try:
            if p1 is None and p2 is None:
                p1, p2 = self.parents(node)
            if node != self.hash(text, p1, p2):
                # Clear the revision cache on hash failure. The revision cache
                # only stores the raw revision and clearing the cache does have
                # the side-effect that we won't have a cache hit when the raw
                # revision data is accessed. But this case should be rare and
                # it is extra work to teach the cache about the hash
                # verification state.
                if (
                    self._inner._revisioncache
                    and self._inner._revisioncache[0] == node
                ):
                    self._inner._revisioncache = None

                revornode = rev
                if revornode is None:
                    revornode = templatefilters.short(hex(node))
                raise error.RevlogError(
                    _(b"integrity check failed on %s:%s")
                    % (self.display_id, pycompat.bytestr(revornode))
                )
        except error.RevlogError:
            if self.feature_config.censorable and storageutil.iscensoredtext(
                text
            ):
                raise error.CensoredNodeError(self.display_id, node, text)
            raise

    @property
    def _split_index_file(self):
        """the path at which to expect the index of an ongoing split operation

        The file will only exist if a splitting operation is in progress, but
        it is always expected at the same location."""
        parts = self.radix.split(b'/')
        if len(parts) > 1:
            # adds a '-s' suffix to the `data/` or `meta/` base directory
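            # e.g. a radix of "data/some/file" gives "data-s/some/file.i"
            # ("data/some/file" is a hypothetical path, for illustration)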
            head = parts[0] + b'-s'
            mids = parts[1:-1]
            tail = parts[-1] + b'.i'
            pieces = [head] + mids + [tail]
            return b'/'.join(pieces)
        else:
            # the revlog is stored at the root of the store (changelog or
            # manifest), no risk of collision.
            return self.radix + b'.i.s'

    def _enforceinlinesize(self, tr, side_write=True):
        """Check if the revlog is too big for inline and convert if so.

        This should be called after revisions are added to the revlog. If the
        revlog has grown too large to be an inline revlog, it will convert it
        to use multiple index and data files.
        """
        tiprev = len(self) - 1
        total_size = self.start(tiprev) + self.length(tiprev)
        if not self._inline or total_size < _maxinline:
            return

        if self._docket is not None:
            msg = b"inline revlog should not have a docket"
            raise error.ProgrammingError(msg)

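        # Look the revlog up in the transaction under its canonical index
        # file name: the inner revlog may currently be writing somewhere
        # else (e.g. a temporary file while a split is in flight), hence
        # `canonical_index_file` rather than `self._indexfile` below.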
        troffset = tr.findoffset(self._inner.canonical_index_file)
        if troffset is None:
            raise error.RevlogError(
                _(b"%s not found in the transaction") % self._indexfile
            )
        if troffset:
            tr.addbackup(self._inner.canonical_index_file, for_offset=True)
        tr.add(self._datafile, 0)

        new_index_file_path = None
        if side_write:
            old_index_file_path = self._indexfile
            new_index_file_path = self._split_index_file
            opener = self.opener
            weak_self = weakref.ref(self)

            # the "split" index replaces the real index when the transaction
            # is finalized
            def finalize_callback(tr):
                opener.rename(
                    new_index_file_path,
                    old_index_file_path,
                    checkambig=True,
                )
                maybe_self = weak_self()
                if maybe_self is not None:
                    maybe_self._indexfile = old_index_file_path
                    maybe_self._inner.index_file = maybe_self._indexfile

            def abort_callback(tr):
                maybe_self = weak_self()
                if maybe_self is not None:
                    maybe_self._indexfile = old_index_file_path
                    maybe_self._inner.inline = True
                    maybe_self._inner.index_file = old_index_file_path

            tr.registertmp(new_index_file_path)
            if self.target[1] is not None:
                callback_id = b'000-revlog-split-%d-%s' % self.target
            else:
                callback_id = b'000-revlog-split-%d' % self.target[0]
            tr.addfinalize(callback_id, finalize_callback)
            tr.addabort(callback_id, abort_callback)

        self._format_flags &= ~FLAG_INLINE_DATA
        self._inner.split_inline(
            tr,
            self._format_flags | self._format_version,
            new_index_file_path=new_index_file_path,
        )

        self._inline = False
        if new_index_file_path is not None:
            self._indexfile = new_index_file_path

        nodemaputil.setup_persistent_nodemap(tr, self)

    def _nodeduplicatecallback(self, transaction, node):
        """called when trying to add a node already stored."""

    @contextlib.contextmanager
    def reading(self):
        with self._inner.reading():
            yield

    @contextlib.contextmanager
    def _writing(self, transaction):
        if self._trypending:
            msg = b'trying to write in a `trypending` revlog: %s'
            msg %= self.display_id
            raise error.ProgrammingError(msg)
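        # writing contexts are reentrant: when the inner revlog is already
        # opened for writing, simply nest inside the existing context.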
        if self._inner.is_writing:
            yield
        else:
            data_end = None
            sidedata_end = None
            if self._docket is not None:
                data_end = self._docket.data_end
                sidedata_end = self._docket.sidedata_end
            with self._inner.writing(
                transaction,
                data_end=data_end,
                sidedata_end=sidedata_end,
            ):
                yield
                if self._docket is not None:
                    self._write_docket(transaction)

    def _write_docket(self, transaction):
        """write the current docket on disk

        Exists as a method to help the changelog implement its transaction
        logic.

        We could also imagine using the same transaction logic for all
        revlogs since dockets are cheap."""
        self._docket.write(transaction)

    def addrevision(
        self,
        text,
        transaction,
        link,
        p1,
        p2,
        cachedelta=None,
        node=None,
        flags=REVIDX_DEFAULT_FLAGS,
        deltacomputer=None,
        sidedata=None,
    ):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        cachedelta - an optional precomputed delta
        node - nodeid of revision; typically node is not specified, and it is
            computed by default as hash(text, p1, p2), however subclasses
            might use a different hashing method (and override checkhash()
            in that case)
        flags - the known flags to set on the revision
        deltacomputer - an optional deltacomputer instance shared between
            multiple calls
        """
        if link == nullrev:
            raise error.RevlogError(
                _(b"attempted to add linkrev -1 to %s") % self.display_id
            )

        if sidedata is None:
            sidedata = {}
        elif sidedata and not self.feature_config.has_side_data:
            raise error.ProgrammingError(
                _(b"trying to add sidedata to a revlog that does not support them")
            )

        if flags:
            node = node or self.hash(text, p1, p2)

        rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

        # If the flag processor modifies the revision data, ignore any provided
        # cachedelta.
        if rawtext != text:
            cachedelta = None

        if len(rawtext) > _maxentrysize:
            raise error.RevlogError(
                _(
                    b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                )
                % (self.display_id, len(rawtext))
            )

        node = node or self.hash(rawtext, p1, p2)
        rev = self.index.get_rev(node)
        if rev is not None:
            return rev

        if validatehash:
            self.checkhash(rawtext, node, p1=p1, p2=p2)

        return self.addrawrevision(
            rawtext,
            transaction,
            link,
            p1,
            p2,
            node,
            flags,
            cachedelta=cachedelta,
            deltacomputer=deltacomputer,
            sidedata=sidedata,
        )

    def addrawrevision(
        self,
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=None,
        deltacomputer=None,
        sidedata=None,
    ):
        """add a raw revision with known flags, node and parents
        useful when reusing a revision not stored in this revlog (ex: received
        over the wire, or read from an external bundle).
        """
        with self._writing(transaction):
            return self._addrevision(
                node,
                rawtext,
                transaction,
                link,
                p1,
                p2,
                flags,
                cachedelta,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )

    def compress(self, data):
        return self._inner.compress(data)

    def decompress(self, data):
        return self._inner.decompress(data)

    def _addrevision(
        self,
        node,
        rawtext,
        transaction,
        link,
        p1,
        p2,
        flags,
        cachedelta,
        alwayscache=False,
        deltacomputer=None,
        sidedata=None,
    ):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.

        note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

        if "deltacomputer" is not provided or None, a defaultdeltacomputer will
        be used.

        invariants:
        - rawtext is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        if node == self.nullid:
            raise error.RevlogError(
                _(b"%s: attempt to add null revision") % self.display_id
            )
        if (
            node == self.nodeconstants.wdirid
            or node in self.nodeconstants.wdirfilenodeids
        ):
            raise error.RevlogError(
                _(b"%s: attempt to add wdir revision") % self.display_id
            )
        if self._inner._writinghandles is None:
            msg = b'adding revision outside `revlog._writing` context'
            raise error.ProgrammingError(msg)

        btext = [rawtext]

        curr = len(self)
        prev = curr - 1

        offset = self._get_data_offset(prev)

        if self._concurrencychecker:
            ifh, dfh, sdfh = self._inner._writinghandles
            # XXX no checking for the sidedata file
            if self._inline:
                # offset is "as if" it were in the .d file, so we need to add on
                # the size of the entry metadata.
                self._concurrencychecker(
                    ifh, self._indexfile, offset + curr * self.index.entry_size
                )
            else:
                # Entries in the .i are a consistent size.
                self._concurrencychecker(
                    ifh, self._indexfile, curr * self.index.entry_size
                )
                self._concurrencychecker(dfh, self._datafile, offset)

        p1r, p2r = self.rev(p1), self.rev(p2)

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if rawtext is None:
            # need rawtext size, before changed by flag processors, which is
            # the non-raw size. use revlog explicitly to avoid filelog's extra
            # logic that might remove metadata size.
            textlen = mdiff.patchedsize(
                revlog.size(self, cachedelta[0]), cachedelta[1]
            )
        else:
            textlen = len(rawtext)

        if deltacomputer is None:
            write_debug = None
            if self.delta_config.debug_delta:
                write_debug = transaction._report
            deltacomputer = deltautil.deltacomputer(
                self, write_debug=write_debug
            )

        if cachedelta is not None and len(cachedelta) == 2:
            # If the cached delta has no information about how it should be
            # reused, add the default reuse instruction according to the
            # revlog's configuration.
            if (
                self.delta_config.general_delta
                and self.delta_config.lazy_delta_base
            ):
                delta_base_reuse = DELTA_BASE_REUSE_TRY
            else:
                delta_base_reuse = DELTA_BASE_REUSE_NO
            cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)

        revinfo = revlogutils.revisioninfo(
            node,
            p1,
            p2,
            btext,
            textlen,
            cachedelta,
            flags,
        )

        deltainfo = deltacomputer.finddeltainfo(revinfo)

        compression_mode = COMP_MODE_INLINE
        if self._docket is not None:
            default_comp = self._docket.default_compression_header
            r = deltautil.delta_compression(default_comp, deltainfo)
            compression_mode, deltainfo = r

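        # Sidedata is stored uncompressed (COMP_MODE_PLAIN) unless the
        # compressed form is strictly smaller and cannot be mistaken for
        # plain data (the b'u' header and a leading NUL byte are reserved
        # markers); when the compression header matches the docket default
        # it is stored without the header (COMP_MODE_DEFAULT).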
        sidedata_compression_mode = COMP_MODE_INLINE
        if sidedata and self.feature_config.has_side_data:
            sidedata_compression_mode = COMP_MODE_PLAIN
            serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
            sidedata_offset = self._docket.sidedata_end
            h, comp_sidedata = self._inner.compress(serialized_sidedata)
            if (
                h != b'u'
                and comp_sidedata[0:1] != b'\0'
                and len(comp_sidedata) < len(serialized_sidedata)
            ):
                assert not h
                if (
                    comp_sidedata[0:1]
                    == self._docket.default_compression_header
                ):
                    sidedata_compression_mode = COMP_MODE_DEFAULT
                    serialized_sidedata = comp_sidedata
                else:
                    sidedata_compression_mode = COMP_MODE_INLINE
                    serialized_sidedata = comp_sidedata
        else:
            serialized_sidedata = b""
            # Don't store the offset if the sidedata is empty, that way
            # we can easily detect empty sidedata and they will be no different
            # than ones we manually add.
            sidedata_offset = 0

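        # The rank of a revision is the number of its ancestors, itself
        # included. For a merge, the slow path below computes it as the rank
        # of the higher-numbered parent plus the ancestors of the other
        # parent that the first one does not already account for.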
        rank = RANK_UNKNOWN
        if self.feature_config.compute_rank:
            if (p1r, p2r) == (nullrev, nullrev):
                rank = 1
            elif p1r != nullrev and p2r == nullrev:
                rank = 1 + self.fast_rank(p1r)
            elif p1r == nullrev and p2r != nullrev:
                rank = 1 + self.fast_rank(p2r)
            else:  # merge node
                if rustdagop is not None and self.index.rust_ext_compat:
                    rank = rustdagop.rank(self.index, p1r, p2r)
                else:
                    pmin, pmax = sorted((p1r, p2r))
                    rank = 1 + self.fast_rank(pmax)
                    rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))

        e = revlogutils.entry(
            flags=flags,
            data_offset=offset,
            data_compressed_length=deltainfo.deltalen,
            data_uncompressed_length=textlen,
            data_compression_mode=compression_mode,
            data_delta_base=deltainfo.base,
            link_rev=link,
            parent_rev_1=p1r,
            parent_rev_2=p2r,
            node_id=node,
            sidedata_offset=sidedata_offset,
            sidedata_compressed_length=len(serialized_sidedata),
            sidedata_compression_mode=sidedata_compression_mode,
            rank=rank,
        )

        self.index.append(e)
        entry = self.index.entry_binary(curr)
        if curr == 0 and self._docket is None:
            header = self._format_flags | self._format_version
            header = self.index.pack_header(header)
            entry = header + entry
        self._writeentry(
            transaction,
            entry,
            deltainfo.data,
            link,
            offset,
            serialized_sidedata,
            sidedata_offset,
        )

        rawtext = btext[0]

        if alwayscache and rawtext is None:
            rawtext = deltacomputer.buildtext(revinfo)

        if type(rawtext) == bytes:  # only accept immutable objects
            self._inner._revisioncache = (node, curr, rawtext)
        self._chainbasecache[curr] = deltainfo.chainbase
        return curr

    def _get_data_offset(self, prev):
        """Returns the current offset in the (in-transaction) data file.
        Versions < 2 of the revlog can get this in O(1), while revlog v2
        needs a docket file to store that information: since sidedata can be
        rewritten to the end of the data file within a transaction, you can
        have cases where, for example, rev `n` does not have sidedata while
        rev `n - 1` does, leading to `n - 1`'s sidedata being written after
        `n`'s data.

        TODO cache this in a docket file before getting out of experimental."""
        if self._docket is None:
            return self.end(prev)
        else:
            return self._docket.data_end

    def _writeentry(
        self,
        transaction,
        entry,
        data,
        link,
        offset,
        sidedata,
        sidedata_offset,
    ):
        # Files opened in a+ mode have inconsistent behavior on various
        # platforms. Windows requires that a file positioning call be made
        # when the file handle transitions between reads and writes. See
        # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
        # platforms, Python or the platform itself can be buggy. Some versions
        # of Solaris have been observed to not append at the end of the file
        # if the file was seeked to before the end. See issue4943 for more.
        #
        # We work around this issue by inserting a seek() before writing.
        # Note: This is likely not necessary on Python 3. However, because
        # the file handle is reused for reads and may be seeked there, we need
        # to be careful before changing this.
        index_end = data_end = sidedata_end = None
        if self._docket is not None:
            index_end = self._docket.index_end
            data_end = self._docket.data_end
            sidedata_end = self._docket.sidedata_end

        files_end = self._inner.write_entry(
            transaction,
            entry,
            data,
            link,
            offset,
            sidedata,
            sidedata_offset,
            index_end,
            data_end,
            sidedata_end,
        )
        self._enforceinlinesize(transaction)
        if self._docket is not None:
            self._docket.index_end = files_end[0]
            self._docket.data_end = files_end[1]
            self._docket.sidedata_end = files_end[2]

        nodemaputil.setup_persistent_nodemap(transaction, self)

    def addgroup(
        self,
        deltas,
        linkmapper,
        transaction,
        alwayscache=False,
        addrevisioncb=None,
        duplicaterevisioncb=None,
        debug_info=None,
        delta_base_reuse_policy=None,
    ):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.

        If ``addrevisioncb`` is defined, it will be called with arguments of
        this revlog and the node that was added.
        """

        if self._adding_group:
            raise error.ProgrammingError(b'cannot nest addgroup() calls')

        # read the default delta-base reuse policy from revlog config if the
        # group did not specify one.
        if delta_base_reuse_policy is None:
            if (
                self.delta_config.general_delta
                and self.delta_config.lazy_delta_base
            ):
                delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
            else:
                delta_base_reuse_policy = DELTA_BASE_REUSE_NO

        self._adding_group = True
        empty = True
        try:
            with self._writing(transaction):
                write_debug = None
                if self.delta_config.debug_delta:
                    write_debug = transaction._report
                deltacomputer = deltautil.deltacomputer(
                    self,
                    write_debug=write_debug,
                    debug_info=debug_info,
                )
                # loop through our set of deltas
                for data in deltas:
                    (
                        node,
                        p1,
                        p2,
                        linknode,
                        deltabase,
                        delta,
                        flags,
                        sidedata,
                    ) = data
                    link = linkmapper(linknode)
                    flags = flags or REVIDX_DEFAULT_FLAGS

                    rev = self.index.get_rev(node)
                    if rev is not None:
                        # this can happen if two branches make the same change
                        self._nodeduplicatecallback(transaction, rev)
                        if duplicaterevisioncb:
                            duplicaterevisioncb(self, rev)
                        empty = False
                        continue

                    for p in (p1, p2):
                        if not self.index.has_node(p):
                            raise error.LookupError(
                                p, self.radix, _(b'unknown parent')
                            )

                    if not self.index.has_node(deltabase):
                        raise error.LookupError(
                            deltabase, self.display_id, _(b'unknown delta base')
                        )

                    baserev = self.rev(deltabase)

                    if baserev != nullrev and self.iscensored(baserev):
                        # if base is censored, delta must be full replacement in a
                        # single patch operation
                        hlen = struct.calcsize(b">lll")
                        oldlen = self.rawsize(baserev)
                        newlen = len(delta) - hlen
                        if delta[:hlen] != mdiff.replacediffheader(
                            oldlen, newlen
                        ):
                            raise error.CensoredBaseError(
                                self.display_id, self.node(baserev)
                            )

                    if not flags and self._peek_iscensored(baserev, delta):
                        flags |= REVIDX_ISCENSORED

                    # We assume consumers of addrevisioncb will want to retrieve
                    # the added revision, which will require a call to
                    # revision(). revision() will fast path if there is a cache
                    # hit. So, we tell _addrevision() to always cache in this case.
                    # We're only using addgroup() in the context of changegroup
                    # generation so the revision data can always be handled as raw
                    # by the flagprocessor.
                    rev = self._addrevision(
                        node,
                        None,
                        transaction,
                        link,
                        p1,
                        p2,
                        flags,
                        (baserev, delta, delta_base_reuse_policy),
                        alwayscache=alwayscache,
                        deltacomputer=deltacomputer,
                        sidedata=sidedata,
                    )

                    if addrevisioncb:
                        addrevisioncb(self, rev)
                    empty = False
        finally:
            self._adding_group = False
        return not empty

    def iscensored(self, rev):
        """Check if a file revision is censored."""
        if not self.feature_config.censorable:
            return False

        return self.flags(rev) & REVIDX_ISCENSORED

    def _peek_iscensored(self, baserev, delta):
        """Quickly check if a delta produces a censored revision."""
        if not self.feature_config.censorable:
            return False

        return storageutil.deltaiscensored(delta, baserev, self.rawsize)

    def getstrippoint(self, minlink):
        """find the minimum rev that must be stripped to strip the linkrev

        Returns a tuple containing the minimum rev and a set of all revs that
        have linkrevs that will be broken by this strip.
        """
        return storageutil.resolvestripinfo(
            minlink,
            len(self) - 1,
            self.headrevs(),
            self.linkrev,
            self.parentrevs,
        )

    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        rev, _ = self.getstrippoint(minlink)
        if rev == len(self):
            return

        # first truncate the files on disk
        data_end = self.start(rev)
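        # in an inline revlog the index entries and data chunks share the
        # ".i" file, so the truncation point must cover both; otherwise the
        # index is cut at a fixed entry_size boundary.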
        if not self._inline:
            transaction.add(self._datafile, data_end)
            end = rev * self.index.entry_size
        else:
            end = data_end + (rev * self.index.entry_size)

        if self._sidedatafile:
            sidedata_end = self.sidedata_cut_off(rev)
            transaction.add(self._sidedatafile, sidedata_end)

        transaction.add(self._indexfile, end)
        if self._docket is not None:
            # XXX we could leverage the docket while stripping. However it is
            # not powerful enough at the time of this comment
            self._docket.index_end = end
            self._docket.data_end = data_end
            self._docket.sidedata_end = sidedata_end
            self._docket.write(transaction, stripping=True)

        # then reset internal state in memory to forget those revisions
        self._chaininfocache = util.lrucachedict(500)
        self._inner.clear_cache()

        del self.index[rev:-1]

    def checksize(self):
        """Check size of index and data files

        return a (dd, di) tuple.
        - dd: extra bytes for the "data" file
        - di: extra bytes for the "index" file

        A healthy revlog will return (0, 0).
        """
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            with self._datafp() as f:
                f.seek(0, io.SEEK_END)
                actual = f.tell()
            dd = actual - expected
        except FileNotFoundError:
            dd = 0

        try:
            f = self.opener(self._indexfile)
            f.seek(0, io.SEEK_END)
            actual = f.tell()
            f.close()
            s = self.index.entry_size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except FileNotFoundError:
            di = 0

        return (dd, di)

    def files(self):
        """return list of files that compose this revlog"""
        res = [self._indexfile]
        if self._docket_file is None:
            if not self._inline:
                res.append(self._datafile)
        else:
            res.append(self._docket_file)
            res.extend(self._docket.old_index_filepaths(include_empty=False))
            if self._docket.data_end:
                res.append(self._datafile)
            res.extend(self._docket.old_data_filepaths(include_empty=False))
            if self._docket.sidedata_end:
                res.append(self._sidedatafile)
            res.extend(self._docket.old_sidedata_filepaths(include_empty=False))
        return res

    def emitrevisions(
        self,
        nodes,
        nodesorder=None,
        revisiondata=False,
        assumehaveparentrevisions=False,
        deltamode=repository.CG_DELTAMODE_STD,
        sidedata_helpers=None,
        debug_info=None,
    ):
        if nodesorder not in (b'nodes', b'storage', b'linear', None):
            raise error.ProgrammingError(
                b'unhandled value for nodesorder: %s' % nodesorder
            )

        if nodesorder is None and not self.delta_config.general_delta:
            nodesorder = b'storage'

        if (
            not self._storedeltachains
            and deltamode != repository.CG_DELTAMODE_PREV
        ):
            deltamode = repository.CG_DELTAMODE_FULL

        return storageutil.emitrevisions(
            self,
            nodes,
            nodesorder,
            revlogrevisiondelta,
            deltaparentfn=self.deltaparent,
            candeltafn=self._candelta,
            rawsizefn=self.rawsize,
            revdifffn=self.revdiff,
            flagsfn=self.flags,
            deltamode=deltamode,
            revisiondata=revisiondata,
            assumehaveparentrevisions=assumehaveparentrevisions,
            sidedata_helpers=sidedata_helpers,
            debug_info=debug_info,
        )

    DELTAREUSEALWAYS = b'always'
    DELTAREUSESAMEREVS = b'samerevs'
    DELTAREUSENEVER = b'never'

    DELTAREUSEFULLADD = b'fulladd'

    DELTAREUSEALL = {b'always', b'samerevs', b'never', b'fulladd'}

3626 def clone(
3630 def clone(
3627 self,
3631 self,
3628 tr,
3632 tr,
3629 destrevlog,
3633 destrevlog,
3630 addrevisioncb=None,
3634 addrevisioncb=None,
3631 deltareuse=DELTAREUSESAMEREVS,
3635 deltareuse=DELTAREUSESAMEREVS,
3632 forcedeltabothparents=None,
3636 forcedeltabothparents=None,
3633 sidedata_helpers=None,
3637 sidedata_helpers=None,
3634 ):
3638 ):
3635 """Copy this revlog to another, possibly with format changes.
3639 """Copy this revlog to another, possibly with format changes.
3636
3640
3637 The destination revlog will contain the same revisions and nodes.
3641 The destination revlog will contain the same revisions and nodes.
3638 However, it may not be bit-for-bit identical due to e.g. delta encoding
3642 However, it may not be bit-for-bit identical due to e.g. delta encoding
3639 differences.
3643 differences.
3640
3644
3641 The ``deltareuse`` argument control how deltas from the existing revlog
3645 The ``deltareuse`` argument control how deltas from the existing revlog
3642 are preserved in the destination revlog. The argument can have the
3646 are preserved in the destination revlog. The argument can have the
3643 following values:
3647 following values:
3644
3648
3645 DELTAREUSEALWAYS
3649 DELTAREUSEALWAYS
3646 Deltas will always be reused (if possible), even if the destination
3650 Deltas will always be reused (if possible), even if the destination
3647 revlog would not select the same revisions for the delta. This is the
3651 revlog would not select the same revisions for the delta. This is the
3648 fastest mode of operation.
3652 fastest mode of operation.
3649 DELTAREUSESAMEREVS
3653 DELTAREUSESAMEREVS
3650 Deltas will be reused if the destination revlog would pick the same
3654 Deltas will be reused if the destination revlog would pick the same
3651 revisions for the delta. This mode strikes a balance between speed
3655 revisions for the delta. This mode strikes a balance between speed
3652 and optimization.
3656 and optimization.
3653 DELTAREUSENEVER
3657 DELTAREUSENEVER
3654 Deltas will never be reused. This is the slowest mode of execution.
3658 Deltas will never be reused. This is the slowest mode of execution.
3655 This mode can be used to recompute deltas (e.g. if the diff/delta
3659 This mode can be used to recompute deltas (e.g. if the diff/delta
3656 algorithm changes).
3660 algorithm changes).
3657 DELTAREUSEFULLADD
3661 DELTAREUSEFULLADD
3658 Revision will be re-added as if their were new content. This is
3662 Revision will be re-added as if their were new content. This is
3659 slower than DELTAREUSEALWAYS but allow more mechanism to kicks in.
3663 slower than DELTAREUSEALWAYS but allow more mechanism to kicks in.
3660 eg: large file detection and handling.
3664 eg: large file detection and handling.
3661
3665
3662 Delta computation can be slow, so the choice of delta reuse policy can
3666 Delta computation can be slow, so the choice of delta reuse policy can
3663 significantly affect run time.
3667 significantly affect run time.
3664
3668
3665 The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
3669 The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
3666 two extremes. Deltas will be reused if they are appropriate. But if the
3670 two extremes. Deltas will be reused if they are appropriate. But if the
3667 delta could choose a better revision, it will do so. This means if you
3671 delta could choose a better revision, it will do so. This means if you
3668 are converting a non-generaldelta revlog to a generaldelta revlog,
3672 are converting a non-generaldelta revlog to a generaldelta revlog,
3669 deltas will be recomputed if the delta's parent isn't a parent of the
3673 deltas will be recomputed if the delta's parent isn't a parent of the
3670 revision.
3674 revision.
3671
3675
3672 In addition to the delta policy, the ``forcedeltabothparents``
3676 In addition to the delta policy, the ``forcedeltabothparents``
3673 argument controls whether to force compute deltas against both parents
3677 argument controls whether to force compute deltas against both parents
3674 for merges. By default, the current default is used.
3678 for merges. By default, the current default is used.
3675
3679
3676 See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
3680 See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
3677 `sidedata_helpers`.
3681 `sidedata_helpers`.
3678 """
3682 """
        if deltareuse not in self.DELTAREUSEALL:
            raise ValueError(
                _(b'value for deltareuse invalid: %s') % deltareuse
            )

        if len(destrevlog):
            raise ValueError(_(b'destination revlog is not empty'))

        if getattr(self, 'filteredrevs', None):
            raise ValueError(_(b'source revlog has filtered revisions'))
        if getattr(destrevlog, 'filteredrevs', None):
            raise ValueError(_(b'destination revlog has filtered revisions'))

        # lazy_delta and lazy_delta_base control whether to reuse a cached
        # delta, if possible.
        old_delta_config = destrevlog.delta_config
        destrevlog.delta_config = destrevlog.delta_config.copy()

        try:
            if deltareuse == self.DELTAREUSEALWAYS:
                destrevlog.delta_config.lazy_delta_base = True
                destrevlog.delta_config.lazy_delta = True
            elif deltareuse == self.DELTAREUSESAMEREVS:
                destrevlog.delta_config.lazy_delta_base = False
                destrevlog.delta_config.lazy_delta = True
            elif deltareuse == self.DELTAREUSENEVER:
                destrevlog.delta_config.lazy_delta_base = False
                destrevlog.delta_config.lazy_delta = False
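            # Descriptive summary of the mapping above (added note):
            # ALWAYS reuses both the delta and its base, SAMEREVS reuses
            # the delta only when the destination would pick the same base,
            # NEVER forces full recomputation, and FULLADD leaves the
            # config untouched because it is handled per-revision in
            # _clone().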

            delta_both_parents = (
                forcedeltabothparents or old_delta_config.delta_both_parents
            )
            destrevlog.delta_config.delta_both_parents = delta_both_parents

            with self.reading(), destrevlog._writing(tr):
                self._clone(
                    tr,
                    destrevlog,
                    addrevisioncb,
                    deltareuse,
                    forcedeltabothparents,
                    sidedata_helpers,
                )

        finally:
            destrevlog.delta_config = old_delta_config

    def _clone(
        self,
        tr,
        destrevlog,
        addrevisioncb,
        deltareuse,
        forcedeltabothparents,
        sidedata_helpers,
    ):
        """perform the core duty of `revlog.clone` after parameter processing"""
        write_debug = None
        if self.delta_config.debug_delta:
            write_debug = tr._report
        deltacomputer = deltautil.deltacomputer(
            destrevlog,
            write_debug=write_debug,
        )
        index = self.index
        for rev in self:
            entry = index[rev]

            # Some classes override linkrev to take filtered revs into
            # account. Use raw entry from index.
            flags = entry[0] & 0xFFFF
            linkrev = entry[4]
            p1 = index[entry[5]][7]
            p2 = index[entry[6]][7]
            node = entry[7]
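            # Index entry layout reminder (added note; see the index
            # implementations for the authoritative definition): entry[0]
            # packs the data offset in its high bits and the revision flags
            # in its low 16 bits, entry[4] is the linkrev, entry[5] and
            # entry[6] are parent revision numbers, and entry[7] is the
            # node id -- so index[entry[5]][7] maps a parent rev to its node.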

            # (Possibly) reuse the delta from the revlog if allowed and
            # the revlog chunk is a delta.
            cachedelta = None
            rawtext = None
            if deltareuse == self.DELTAREUSEFULLADD:
                text = self._revisiondata(rev)
                sidedata = self.sidedata(rev)

                if sidedata_helpers is not None:
                    (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                        self, sidedata_helpers, sidedata, rev
                    )
                    flags = flags | new_flags[0] & ~new_flags[1]
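                    # Precedence note (added comment): `&` binds tighter
                    # than `|`, so this computes
                    # flags | (new_flags[0] & ~new_flags[1]); the helpers'
                    # "remove" mask filters the newly added bits, it does
                    # not clear pre-existing flags.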

                destrevlog.addrevision(
                    text,
                    tr,
                    linkrev,
                    p1,
                    p2,
                    cachedelta=cachedelta,
                    node=node,
                    flags=flags,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )
            else:
                if destrevlog.delta_config.lazy_delta:
                    dp = self.deltaparent(rev)
                    if dp != nullrev:
                        cachedelta = (dp, bytes(self._inner._chunk(rev)))
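                # Added note: `cachedelta` is a (base-rev, delta-bytes)
                # pair; when set, the destination may store the existing
                # delta as-is instead of recomputing one.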

                sidedata = None
                if not cachedelta:
                    try:
                        rawtext = self._revisiondata(rev)
                    except error.CensoredNodeError as censored:
                        assert flags & REVIDX_ISCENSORED
                        rawtext = censored.tombstone
                    sidedata = self.sidedata(rev)
                if sidedata is None:
                    sidedata = self.sidedata(rev)

                if sidedata_helpers is not None:
                    (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                        self, sidedata_helpers, sidedata, rev
                    )
                    flags = flags | new_flags[0] & ~new_flags[1]

                destrevlog._addrevision(
                    node,
                    rawtext,
                    tr,
                    linkrev,
                    p1,
                    p2,
                    flags,
                    cachedelta,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

            if addrevisioncb:
                addrevisioncb(self, rev, node)

    def censorrevision(self, tr, censornode, tombstone=b''):
        if self._format_version == REVLOGV0:
            raise error.RevlogError(
                _(b'cannot censor with version %d revlogs')
                % self._format_version
            )
        elif self._format_version == REVLOGV1:
            rewrite.v1_censor(self, tr, censornode, tombstone)
        else:
            rewrite.v2_censor(self, tr, censornode, tombstone)
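        # Illustrative sketch (not part of the original module): censoring
        # replaces one revision's content with a tombstone while keeping
        # the graph intact, roughly:
        #
        #     rl.censorrevision(tr, node, tombstone=b'removed')
        #
        # assuming `rl`, `tr` and `node` exist in the caller.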

    def verifyintegrity(self, state):
        """Verifies the integrity of the revlog.

        Yields ``revlogproblem`` instances describing problems that are
        found.
        """
        dd, di = self.checksize()
        if dd:
            yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
        if di:
            yield revlogproblem(error=_(b'index contains %d extra bytes') % di)

        version = self._format_version

        # The verifier tells us what version revlog we should be.
        if version != state[b'expectedversion']:
            yield revlogproblem(
                warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                % (self.display_id, version, state[b'expectedversion'])
            )

        state[b'skipread'] = set()
        state[b'safe_renamed'] = set()

        for rev in self:
            node = self.node(rev)

            # Verify contents. 4 cases to care about:
            #
            #   common: the most common case
            #   rename: with a rename
            #   meta:   file content starts with b'\1\n', the metadata
            #           header defined in filelog.py, but without a rename
            #   ext:    content stored externally
            #
            # More formally, their differences are shown below:
            #
            #                       | common | rename | meta  | ext
            #  -------------------------------------------------------
            #  flags()              | 0      | 0      | 0     | not 0
            #  renamed()            | False  | True   | False | ?
            #  rawtext[0:2]=='\1\n' | False  | True   | True  | ?
            #
            # "rawtext" means the raw text stored in revlog data, which
            # could be retrieved by "rawdata(rev)". "text" mentioned below
            # is "revision(rev)".
            #
            # There are 3 different lengths stored physically:
            #  1. L1: rawsize, stored in revlog index
            #  2. L2: len(rawtext), stored in revlog data
            #  3. L3: len(text), stored in revlog data if flags==0, or
            #     possibly somewhere else if flags!=0
            #
            # L1 should be equal to L2. L3 could be different from them.
            # "text" may or may not affect commit hash depending on flag
            # processors (see flagutil.addflagprocessor).
            #
            #              | common | rename | meta  | ext
            # -------------------------------------------------
            # rawsize()    | L1     | L1     | L1    | L1
            # size()       | L1     | L2-LM  | L1(*) | L1 (?)
            # len(rawtext) | L2     | L2     | L2    | L2
            # len(text)    | L2     | L2     | L2    | L3
            # len(read())  | L2     | L2-LM  | L2-LM | L3 (?)
            #
            # LM:  length of metadata, depending on rawtext
            # (*): not ideal, see comment in filelog.size
            # (?): could be "- len(meta)" if the resolved content has
            #      rename metadata
            #
            # Checks that need to be done:
            #  1. length check: L1 == L2, in all cases.
            #  2. hash check: depending on flag processor, we may need to
            #     use either "text" (external), or "rawtext" (in revlog).

            try:
                skipflags = state.get(b'skipflags', 0)
                if skipflags:
                    skipflags &= self.flags(rev)

                _verify_revision(self, skipflags, state, node)

                l1 = self.rawsize(rev)
                l2 = len(self.rawdata(node))

                if l1 != l2:
                    yield revlogproblem(
                        error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                        node=node,
                    )

            except error.CensoredNodeError:
                if state[b'erroroncensored']:
                    yield revlogproblem(
                        error=_(b'censored file data'), node=node
                    )
                state[b'skipread'].add(node)
            except Exception as e:
                yield revlogproblem(
                    error=_(b'unpacking %s: %s')
                    % (short(node), stringutil.forcebytestr(e)),
                    node=node,
                )
                state[b'skipread'].add(node)

    def storageinfo(
        self,
        exclusivefiles=False,
        sharedfiles=False,
        revisionscount=False,
        trackedsize=False,
        storedsize=False,
    ):
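        # Illustrative sketch (not part of the original module): each
        # keyword opts into one piece of information, e.g.:
        #
        #     info = rl.storageinfo(revisionscount=True, trackedsize=True)
        #     # -> {b'revisionscount': ..., b'trackedsize': ...}
        #
        # assuming `rl` is an open revlog.
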
        d = {}

        if exclusivefiles:
            d[b'exclusivefiles'] = [(self.opener, self._indexfile)]
            if not self._inline:
                d[b'exclusivefiles'].append((self.opener, self._datafile))

        if sharedfiles:
            d[b'sharedfiles'] = []

        if revisionscount:
            d[b'revisionscount'] = len(self)

        if trackedsize:
            d[b'trackedsize'] = sum(map(self.rawsize, iter(self)))

        if storedsize:
            d[b'storedsize'] = sum(
                self.opener.stat(path).st_size for path in self.files()
            )

        return d

    def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
        if not self.feature_config.has_side_data:
            return
        # revlog formats with sidedata support do not support inline storage
        assert not self._inline
        if not helpers[1] and not helpers[2]:
            # Nothing to generate or remove
            return

        new_entries = []
        # append the new sidedata
        with self._writing(transaction):
            ifh, dfh, sdfh = self._inner._writinghandles
            dfh.seek(self._docket.sidedata_end, os.SEEK_SET)

            current_offset = sdfh.tell()
            for rev in range(startrev, endrev + 1):
                entry = self.index[rev]
                new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                    store=self,
                    sidedata_helpers=helpers,
                    sidedata={},
                    rev=rev,
                )

                serialized_sidedata = sidedatautil.serialize_sidedata(
                    new_sidedata
                )

                sidedata_compression_mode = COMP_MODE_INLINE
                if serialized_sidedata and self.feature_config.has_side_data:
                    sidedata_compression_mode = COMP_MODE_PLAIN
                    h, comp_sidedata = self._inner.compress(serialized_sidedata)
                    # compare the first byte as a bytes slice: indexing
                    # bytes yields an int on Python 3
                    if (
                        h != b'u'
                        and comp_sidedata[0:1] != b'\0'
                        and len(comp_sidedata) < len(serialized_sidedata)
                    ):
                        assert not h
                        if (
                            comp_sidedata[0:1]
                            == self._docket.default_compression_header
                        ):
                            sidedata_compression_mode = COMP_MODE_DEFAULT
                            serialized_sidedata = comp_sidedata
                        else:
                            sidedata_compression_mode = COMP_MODE_INLINE
                            serialized_sidedata = comp_sidedata
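                # Added note on the three modes: COMP_MODE_PLAIN stores the
                # sidedata uncompressed, COMP_MODE_DEFAULT stores it
                # compressed with the docket's default engine (so no
                # per-chunk header is needed), and COMP_MODE_INLINE keeps a
                # compression header inline with the chunk itself.
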
                if entry[8] != 0 or entry[9] != 0:
                    # rewriting entries that already have sidedata is not
                    # supported yet, because it introduces garbage data in
                    # the revlog.
                    msg = b"rewriting existing sidedata is not supported yet"
                    raise error.Abort(msg)

                # Apply (potential) flags to add and to remove after running
                # the sidedata helpers
                new_offset_flags = entry[0] | flags[0] & ~flags[1]
                entry_update = (
                    current_offset,
                    len(serialized_sidedata),
                    new_offset_flags,
                    sidedata_compression_mode,
                )

                # the sidedata computation might have moved the file cursors
                # around
                sdfh.seek(current_offset, os.SEEK_SET)
                sdfh.write(serialized_sidedata)
                new_entries.append(entry_update)
                current_offset += len(serialized_sidedata)
            self._docket.sidedata_end = sdfh.tell()

            # rewrite the new index entries
            ifh.seek(startrev * self.index.entry_size)
            for i, e in enumerate(new_entries):
                rev = startrev + i
                self.index.replace_sidedata_info(rev, *e)
                packed = self.index.entry_binary(rev)
                if rev == 0 and self._docket is None:
                    header = self._format_flags | self._format_version
                    header = self.index.pack_header(header)
                    packed = header + packed
                ifh.write(packed)