upstream/mercurial-mirror Commit - r51943:0d33f4b0

1

# revlog.py - storage back-end for mercurial

1

# revlog.py - storage back-end for mercurial

2

# coding: utf8

2

# coding: utf8

3

#

3

#

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

"""Storage back-end for Mercurial.

9

"""Storage back-end for Mercurial.

10

11

This provides efficient delta storage with O(1) retrieve and append

11

This provides efficient delta storage with O(1) retrieve and append

12

and O(changes) merge between branches.

12

and O(changes) merge between branches.

13

"""

13

"""

14

15

16

import binascii

16

import binascii

17

import collections

17

import collections

18

import contextlib

18

import contextlib

19

import io

19

import io

20

import os

20

import os

21

import struct

21

import struct

22

import weakref

22

import weakref

23

import zlib

23

import zlib

24

25

# import stuff from node for others to import from revlog

25

# import stuff from node for others to import from revlog

26

from .node import (

26

from .node import (

27

bin,

27

bin,

28

hex,

28

hex,

29

nullrev,

29

nullrev,

30

sha1nodeconstants,

30

sha1nodeconstants,

31

short,

31

short,

32

wdirrev,

32

wdirrev,

33

)

33

)

34

from .i18n import _

34

from .i18n import _

35

from .revlogutils.constants import (

35

from .revlogutils.constants import (

36

ALL_KINDS,

36

ALL_KINDS,

37

CHANGELOGV2,

37

CHANGELOGV2,

38

COMP_MODE_DEFAULT,

38

COMP_MODE_DEFAULT,

39

COMP_MODE_INLINE,

39

COMP_MODE_INLINE,

40

COMP_MODE_PLAIN,

40

COMP_MODE_PLAIN,

41

DELTA_BASE_REUSE_NO,

41

DELTA_BASE_REUSE_NO,

42

DELTA_BASE_REUSE_TRY,

42

DELTA_BASE_REUSE_TRY,

43

ENTRY_RANK,

43

ENTRY_RANK,

44

FEATURES_BY_VERSION,

44

FEATURES_BY_VERSION,

45

FLAG_GENERALDELTA,

45

FLAG_GENERALDELTA,

46

FLAG_INLINE_DATA,

46

FLAG_INLINE_DATA,

47

INDEX_HEADER,

47

INDEX_HEADER,

48

KIND_CHANGELOG,

48

KIND_CHANGELOG,

49

KIND_FILELOG,

49

KIND_FILELOG,

50

RANK_UNKNOWN,

50

RANK_UNKNOWN,

51

REVLOGV0,

51

REVLOGV0,

52

REVLOGV1,

52

REVLOGV1,

53

REVLOGV1_FLAGS,

53

REVLOGV1_FLAGS,

54

REVLOGV2,

54

REVLOGV2,

55

REVLOGV2_FLAGS,

55

REVLOGV2_FLAGS,

56

REVLOG_DEFAULT_FLAGS,

56

REVLOG_DEFAULT_FLAGS,

57

REVLOG_DEFAULT_FORMAT,

57

REVLOG_DEFAULT_FORMAT,

58

REVLOG_DEFAULT_VERSION,

58

REVLOG_DEFAULT_VERSION,

59

SUPPORTED_FLAGS,

59

SUPPORTED_FLAGS,

60

)

60

)

61

from .revlogutils.flagutil import (

61

from .revlogutils.flagutil import (

62

REVIDX_DEFAULT_FLAGS,

62

REVIDX_DEFAULT_FLAGS,

63

REVIDX_ELLIPSIS,

63

REVIDX_ELLIPSIS,

64

REVIDX_EXTSTORED,

64

REVIDX_EXTSTORED,

65

REVIDX_FLAGS_ORDER,

65

REVIDX_FLAGS_ORDER,

66

REVIDX_HASCOPIESINFO,

66

REVIDX_HASCOPIESINFO,

67

REVIDX_ISCENSORED,

67

REVIDX_ISCENSORED,

68

REVIDX_RAWTEXT_CHANGING_FLAGS,

68

REVIDX_RAWTEXT_CHANGING_FLAGS,

69

)

69

)

70

from .thirdparty import attr

70

from .thirdparty import attr

71

from . import (

71

from . import (

72

ancestor,

72

ancestor,

73

dagop,

73

dagop,

74

error,

74

error,

75

mdiff,

75

mdiff,

76

policy,

76

policy,

77

pycompat,

77

pycompat,

78

revlogutils,

78

revlogutils,

79

templatefilters,

79

templatefilters,

80

util,

80

util,

81

)

81

)

82

from .interfaces import (

82

from .interfaces import (

83

repository,

83

repository,

84

util as interfaceutil,

84

util as interfaceutil,

85

)

85

)

86

from .revlogutils import (

86

from .revlogutils import (

87

deltas as deltautil,

87

deltas as deltautil,

88

docket as docketutil,

88

docket as docketutil,

89

flagutil,

89

flagutil,

90

nodemap as nodemaputil,

90

nodemap as nodemaputil,

91

randomaccessfile,

91

randomaccessfile,

92

revlogv0,

92

revlogv0,

93

rewrite,

93

rewrite,

94

sidedata as sidedatautil,

94

sidedata as sidedatautil,

95

)

95

)

96

from .utils import (

96

from .utils import (

97

storageutil,

97

storageutil,

98

stringutil,

98

stringutil,

99

)

99

)

100

101

# Bare references to all of these names, to keep pyflakes from complaining
# about them.
# We need these names available in the module for extensions.

REVLOGV0
REVLOGV1
REVLOGV2
CHANGELOGV2
FLAG_INLINE_DATA
FLAG_GENERALDELTA
REVLOG_DEFAULT_FLAGS
REVLOG_DEFAULT_FORMAT
REVLOG_DEFAULT_VERSION
REVLOGV1_FLAGS
REVLOGV2_FLAGS
REVIDX_ISCENSORED
REVIDX_ELLIPSIS
REVIDX_HASCOPIESINFO
REVIDX_EXTSTORED
REVIDX_DEFAULT_FLAGS
REVIDX_FLAGS_ORDER
REVIDX_RAWTEXT_CHANGING_FLAGS

122

123

# Implementation modules selected through the `policy` module.
parsers = policy.importmod('parsers')
rustancestor = policy.importrust('ancestor')
rustdagop = policy.importrust('dagop')
rustrevlog = policy.importrust('revlog')

# Aliased for performance.
_zlibdecompress = zlib.decompress

# max size of inline data embedded into a revlog
_maxinline = 131072

133

134

# Flag processors for REVIDX_ELLIPSIS.

134

# Flag processors for REVIDX_ELLIPSIS.

135

def ellipsisreadprocessor(rl, text):
    """Read-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is accepted but not used.  ``text`` is handed back untouched as
    the first element of a ``(text, False)`` pair.
    """
    return text, False

137

138

139

def ellipsiswriteprocessor(rl, text):
    """Write-side flag processor for REVIDX_ELLIPSIS.

    ``rl`` is accepted but not used.  ``text`` is handed back untouched as
    the first element of a ``(text, False)`` pair.
    """
    return text, False

141

142

143

def ellipsisrawprocessor(rl, text):
    """Raw flag processor for REVIDX_ELLIPSIS.

    Both arguments are ignored; the result is always ``False``.
    """
    return False

145

146

147

# The REVIDX_ELLIPSIS processors bundled as a (read, write, raw) triple.
ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)

152

153

154

def _verify_revision(rl, skipflags, state, node):
    """Verify the integrity of the given revlog ``node`` while providing a hook
    point for extensions to influence the operation.

    When ``skipflags`` is truthy the node is only recorded in
    ``state[b'skipread']`` and nothing is read.  Otherwise
    ``rl.revision(node)`` is called and its return value discarded.
    """
    if skipflags:
        state[b'skipread'].add(node)
    else:
        # Side-effect: read content and verify hash.
        rl.revision(node)

162

163

164

# True if a fast implementation for persistent-nodemap is available
#
# We also consider we have a "fast" implementation in "pure" python because
# people using pure don't really have performance considerations (and have a
# wheelbarrow of other sources of slowness)
HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
    parsers, 'BaseIndexObject'
)

172

173

174

@interfaceutil.implementer(repository.irevisiondelta)
@attr.s(slots=True)
class revlogrevisiondelta:
    """Slotted attrs record declared as implementing
    ``repository.irevisiondelta``.

    Every field except ``linknode`` is required; ``linknode`` defaults to
    ``None``.
    """

    node = attr.ib()
    p1node = attr.ib()
    p2node = attr.ib()
    basenode = attr.ib()
    flags = attr.ib()
    baserevisionsize = attr.ib()
    revision = attr.ib()
    delta = attr.ib()
    sidedata = attr.ib()
    protocol_flags = attr.ib()
    linknode = attr.ib(default=None)

188

189

190

@interfaceutil.implementer(repository.iverifyproblem)
@attr.s(frozen=True)
class revlogproblem:
    """Frozen attrs record declared as implementing
    ``repository.iverifyproblem``.

    All three fields are optional and default to ``None``.
    """

    warning = attr.ib(default=None)
    error = attr.ib(default=None)
    node = attr.ib(default=None)

196

197

198

def parse_index_v1(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` using its default
    format, and return the resulting ``(index, cache)`` pair."""
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline)
    return index, cache

202

203

204

def parse_index_v2(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` in ``REVLOGV2``
    format, and return the resulting ``(index, cache)`` pair."""
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=REVLOGV2)
    return index, cache

208

209

210

def parse_index_cl_v2(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` in ``CHANGELOGV2``
    format, and return the resulting ``(index, cache)`` pair."""
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=CHANGELOGV2)
    return index, cache

214

215

216

# `parse_index_v1_nodemap` only exists when the selected `parsers` module
# provides `parse_index_devel_nodemap`; otherwise the name is bound to None.
if hasattr(parsers, 'parse_index_devel_nodemap'):

    def parse_index_v1_nodemap(data, inline):
        """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``
        and return the resulting ``(index, cache)`` pair."""
        index, cache = parsers.parse_index_devel_nodemap(data, inline)
        return index, cache


else:
    parse_index_v1_nodemap = None

225

226

227

def parse_index_v1_mixed(data, inline):
    """Parse index ``data`` with ``parse_index_v1`` and wrap the resulting
    index in ``rustrevlog.MixedIndex``.

    Returns ``(wrapped_index, cache)``.
    """
    index, cache = parse_index_v1(data, inline)
    return rustrevlog.MixedIndex(index), cache

230

231

232

# corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
# signed integer)
_maxentrysize = 0x7FFFFFFF

# Translated message template; takes one %s and three %d substitutions.
FILE_TOO_SHORT_MSG = _(
    b'cannot read from revlog %s;'
    b' expected %d bytes from offset %d, data size is %d'
)

# Every byte accepted as a hexadecimal digit, in either case.
hexdigits = b'0123456789abcdefABCDEF'

242

243

244

class _Config:
    """Base class providing ``copy`` for the configuration holders."""

    def copy(self):
        """Return a new instance of the same class built from this
        instance's attributes.

        The instance ``__dict__`` is passed as keyword arguments to the
        class, so attribute values are shared with the copy, not duplicated.
        """
        return self.__class__(**self.__dict__)

247

248

249

@attr.s()
class FeatureConfig(_Config):
    """Hold configuration values about the available revlog features"""

    # the default compression engine
    compression_engine = attr.ib(default=b'zlib')
    # compression engines options
    compression_engine_options = attr.ib(default=attr.Factory(dict))

    # can we use censor on this revlog
    censorable = attr.ib(default=False)
    # does this revlog use the "side data" feature
    has_side_data = attr.ib(default=False)
    # might remove rank configuration once the computation has no impact
    compute_rank = attr.ib(default=False)
    # parent order is supposed to be semantically irrelevant, so we
    # normally resort parents to ensure that the first parent is non-null,
    # if there is a non-null parent at all.
    # filelog abuses the parent order as flag to mark some instances of
    # meta-encoded files, so allow it to disable this behavior.
    canonical_parent_order = attr.ib(default=False)
    # can ellipsis commit be used
    enable_ellipsis = attr.ib(default=False)

    def copy(self):
        """Return a copy that has its own ``compression_engine_options``.

        The base ``copy`` shares attribute values with the original, so the
        options mapping is copied separately.
        """
        new = super().copy()
        new.compression_engine_options = self.compression_engine_options.copy()
        return new

277

278

279

@attr.s()
class DataConfig(_Config):
    """Hold configuration value about how the revlog data are read"""

    # should we try to open the "pending" version of the revlog
    try_pending = attr.ib(default=False)
    # should we try to open the "splitted" version of the revlog
    try_split = attr.ib(default=False)
    # When True, indexfile should be opened with checkambig=True at writing,
    # to avoid file stat ambiguity.
    check_ambig = attr.ib(default=False)

    # If true, use mmap instead of reading to deal with large index
    mmap_large_index = attr.ib(default=False)
    # how much data is large
    mmap_index_threshold = attr.ib(default=None)
    # How much data to read and cache into the raw revlog data cache.
    chunk_cache_size = attr.ib(default=65536)

    # Allow sparse reading of the revlog data
    with_sparse_read = attr.ib(default=False)
    # minimal density of a sparse read chunk
    sr_density_threshold = attr.ib(default=0.50)
    # minimal size of data we skip when performing sparse read
    sr_min_gap_size = attr.ib(default=262144)

    # are deltas encoded against arbitrary bases.
    generaldelta = attr.ib(default=False)

307

308

309

@attr.s()
class DeltaConfig(_Config):
    """Hold configuration value about how new delta are computed

    Some attributes are duplicated from DataConfig to help having each object
    self contained.
    """

    # can delta be encoded against arbitrary bases.
    general_delta = attr.ib(default=False)
    # Allow sparse writing of the revlog data
    sparse_revlog = attr.ib(default=False)
    # maximum length of a delta chain
    max_chain_len = attr.ib(default=None)
    # Maximum distance between delta chain base start and end
    max_deltachain_span = attr.ib(default=-1)
    # If `upper_bound_comp` is not None, this is the expected maximal gain from
    # compression for the data content.
    upper_bound_comp = attr.ib(default=None)
    # Should we try a delta against both parent
    delta_both_parents = attr.ib(default=True)
    # Test delta base candidate group by chunk of this maximal size.
    candidate_group_chunk_size = attr.ib(default=0)
    # Should we display debug information about delta computation
    debug_delta = attr.ib(default=False)
    # trust incoming delta by default
    lazy_delta = attr.ib(default=True)
    # trust the base of incoming delta by default
    lazy_delta_base = attr.ib(default=False)

338

339

340

class revlog:

340

class revlog:

341

"""

341

"""

342

the underlying revision storage object

342

the underlying revision storage object

343

344

A revlog consists of two parts, an index and the revision data.

344

A revlog consists of two parts, an index and the revision data.

345

346

The index is a file with a fixed record size containing

346

The index is a file with a fixed record size containing

347

information on each revision, including its nodeid (hash), the

347

information on each revision, including its nodeid (hash), the

348

nodeids of its parents, the position and offset of its data within

348

nodeids of its parents, the position and offset of its data within

349

the data file, and the revision it's based on. Finally, each entry

349

the data file, and the revision it's based on. Finally, each entry

350

contains a linkrev entry that can serve as a pointer to external

350

contains a linkrev entry that can serve as a pointer to external

351

data.

351

data.

352

353

The revision data itself is a linear collection of data chunks.

353

The revision data itself is a linear collection of data chunks.

354

Each chunk represents a revision and is usually represented as a

354

Each chunk represents a revision and is usually represented as a

355

delta against the previous chunk. To bound lookup time, runs of

355

delta against the previous chunk. To bound lookup time, runs of

356

deltas are limited to about 2 times the length of the original

356

deltas are limited to about 2 times the length of the original

357

version data. This makes retrieval of a version proportional to

357

version data. This makes retrieval of a version proportional to

358

its size, or O(1) relative to the number of revisions.

358

its size, or O(1) relative to the number of revisions.

359

360

Both pieces of the revlog are written to in an append-only

360

Both pieces of the revlog are written to in an append-only

361

fashion, which means we never need to rewrite a file to insert or

361

fashion, which means we never need to rewrite a file to insert or

362

remove data, and can use some simple techniques to avoid the need

362

remove data, and can use some simple techniques to avoid the need

363

for locking while reading.

363

for locking while reading.

364

365

If checkambig, indexfile is opened with checkambig=True at

365

If checkambig, indexfile is opened with checkambig=True at

366

writing, to avoid file stat ambiguity.

366

writing, to avoid file stat ambiguity.

367

368

If mmaplargeindex is True, and an mmapindexthreshold is set, the

368

If mmaplargeindex is True, and an mmapindexthreshold is set, the

369

index will be mmapped rather than read if it is larger than the

369

index will be mmapped rather than read if it is larger than the

370

configured threshold.

370

configured threshold.

371

372

If censorable is True, the revlog can have censored revisions.

372

If censorable is True, the revlog can have censored revisions.

373

374

If `upperboundcomp` is not None, this is the expected maximal gain from

374

If `upperboundcomp` is not None, this is the expected maximal gain from

375

compression for the data content.

375

compression for the data content.

376

377

`concurrencychecker` is an optional function that receives 3 arguments: a

377

`concurrencychecker` is an optional function that receives 3 arguments: a

378

file handle, a filename, and an expected position. It should check whether

378

file handle, a filename, and an expected position. It should check whether

379

the current position in the file handle is valid, and log/warn/fail (by

379

the current position in the file handle is valid, and log/warn/fail (by

380

raising).

380

raising).

381

382

See mercurial/revlogutils/constants.py for details about the content of an

382

See mercurial/revlogutils/constants.py for details about the content of an

383

index entry.

383

index entry.

384

"""

384

"""

385

386

_flagserrorclass = error.RevlogError

386

_flagserrorclass = error.RevlogError

387

388

@staticmethod
def is_inline_index(header_bytes):
    """Determine if a revlog is inline from the initial bytes of the index

    ``header_bytes`` is unpacked with ``INDEX_HEADER``.  The low 16 bits of
    the first unpacked value are the format version and the remaining bits
    are the format flags.  The answer comes from the ``b'inline'`` callable
    registered for that version in ``FEATURES_BY_VERSION``.
    """
    header = INDEX_HEADER.unpack(header_bytes)[0]

    _format_flags = header & ~0xFFFF
    _format_version = header & 0xFFFF

    features = FEATURES_BY_VERSION[_format_version]
    return features[b'inline'](_format_flags)

398

399

def __init__(
    self,
    opener,
    target,
    radix,
    postfix=None,  # only exist for `tmpcensored` now
    checkambig=False,
    mmaplargeindex=False,
    censorable=False,
    upperboundcomp=None,
    persistentnodemap=False,
    concurrencychecker=None,
    trypending=False,
    try_split=False,
    canonical_parent_order=True,
):
    """
    create a revlog object

    opener is a function that abstracts the file opening operation
    and can be used to implement COW semantics or the like.

    `target`: a (KIND, ID) tuple that identifies the content stored in
    this revlog. It helps the rest of the code to understand what the
    revlog is about without having to resort to heuristics and index
    filename analysis. Note that this must be reliably set by normal
    code, but that test, debug, or performance measurement code might not
    set this to an accurate value.

    The feature, data and delta configurations are copied from
    `opener.options` when present there (keys `feature-config`,
    `data-config`, `delta-config`) and default-constructed otherwise.
    `censorable`, `canonical_parent_order`, `checkambig` and
    `mmaplargeindex` are then written onto the resulting configuration
    objects.
    """
    self.upperboundcomp = upperboundcomp

    self.radix = radix

    self._docket_file = None
    self._indexfile = None
    self._datafile = None
    self._sidedatafile = None
    self._nodemap_file = None
    self.postfix = postfix
    self._trypending = trypending
    self._try_split = try_split
    self.opener = opener
    if persistentnodemap:
        self._nodemap_file = nodemaputil.get_nodemap_file(self)

    assert target[0] in ALL_KINDS
    assert len(target) == 2
    self.target = target
    # Each configuration is copied out of the opener options so that the
    # per-instance overrides below do not leak into the shared object.
    if b'feature-config' in self.opener.options:
        self.feature_config = self.opener.options[b'feature-config'].copy()
    else:
        self.feature_config = FeatureConfig()
    self.feature_config.censorable = censorable
    self.feature_config.canonical_parent_order = canonical_parent_order
    if b'data-config' in self.opener.options:
        self.data_config = self.opener.options[b'data-config'].copy()
    else:
        self.data_config = DataConfig()
    self.data_config.check_ambig = checkambig
    self.data_config.mmap_large_index = mmaplargeindex
    if b'delta-config' in self.opener.options:
        self.delta_config = self.opener.options[b'delta-config'].copy()
    else:
        self.delta_config = DeltaConfig()

    # 3-tuple of (node, rev, text) for a raw revision.
    self._revisioncache = None
    # Maps rev to chain base rev.
    self._chainbasecache = util.lrucachedict(100)
    # 2-tuple of (offset, data) of raw data from the revlog at an offset.
    self._chunkcache = (0, b'')

    self.index = None
    self._docket = None
    self._nodemap_docket = None
    # Mapping of partial identifiers to full nodes.
    self._pcache = {}

    # other optional features

    # Make copy of flag processors so each revlog instance can support
    # custom flags.
    self._flagprocessors = dict(flagutil.flagprocessors)

    # 3-tuple of file handles being used for active writing.
    self._writinghandles = None
    # prevent nesting of addgroup
    self._adding_group = None

    self._loadindex()

    self._concurrencychecker = concurrencychecker

491

492

@property
def _generaldelta(self):
    """temporary compatibility proxy for ``delta_config.general_delta``"""
    return self.delta_config.general_delta

496

497

@property
def _checkambig(self):
    """temporary compatibility proxy for ``data_config.check_ambig``"""
    return self.data_config.check_ambig

501

502

@property
def _mmaplargeindex(self):
    """temporary compatibility proxy for ``data_config.mmap_large_index``"""
    return self.data_config.mmap_large_index

506

507

@property
def _censorable(self):
    """Temporary compatibility proxy for ``feature_config.censorable``."""
    feature_config = self.feature_config
    return feature_config.censorable

511

512

@property
def _chunkcachesize(self):
    """Temporary compatibility proxy for ``data_config.chunk_cache_size``."""
    data_config = self.data_config
    return data_config.chunk_cache_size

516

517

@property
def _maxchainlen(self):
    """Temporary compatibility proxy for ``delta_config.max_chain_len``."""
    delta_config = self.delta_config
    return delta_config.max_chain_len

521

522

@property
def _deltabothparents(self):
    """Temporary compatibility proxy for ``delta_config.delta_both_parents``."""
    delta_config = self.delta_config
    return delta_config.delta_both_parents

526

527

@property
def _candidate_group_chunk_size(self):
    """Temporary compatibility proxy for
    ``delta_config.candidate_group_chunk_size``."""
    delta_config = self.delta_config
    return delta_config.candidate_group_chunk_size

531

532

@property
def _debug_delta(self):
    """Temporary compatibility proxy for ``delta_config.debug_delta``."""
    delta_config = self.delta_config
    return delta_config.debug_delta

536

537

@property
def _compengine(self):
    """Temporary compatibility proxy for ``feature_config.compression_engine``."""
    feature_config = self.feature_config
    return feature_config.compression_engine

541

542

@property
def _compengineopts(self):
    """Temporary compatibility proxy for
    ``feature_config.compression_engine_options``."""
    feature_config = self.feature_config
    return feature_config.compression_engine_options

546

547

@property
def _maxdeltachainspan(self):
    """Temporary compatibility proxy for ``delta_config.max_deltachain_span``."""
    delta_config = self.delta_config
    return delta_config.max_deltachain_span

551

552

@property
def _withsparseread(self):
    """Temporary compatibility proxy for ``data_config.with_sparse_read``."""
    data_config = self.data_config
    return data_config.with_sparse_read

556

557

@property
def _sparserevlog(self):
    """Temporary compatibility proxy for ``delta_config.sparse_revlog``."""
    delta_config = self.delta_config
    return delta_config.sparse_revlog

561

562

@property
def hassidedata(self):
    """Temporary compatibility proxy for ``feature_config.has_side_data``."""
    feature_config = self.feature_config
    return feature_config.has_side_data

566

567

@property
def _srdensitythreshold(self):
    """Temporary compatibility proxy for ``data_config.sr_density_threshold``."""
    data_config = self.data_config
    return data_config.sr_density_threshold

571

572

@property
def _srmingapsize(self):
    """Temporary compatibility proxy for ``data_config.sr_min_gap_size``."""
    data_config = self.data_config
    return data_config.sr_min_gap_size

576

577

@property
def _compute_rank(self):
    """Temporary compatibility proxy for ``feature_config.compute_rank``."""
    feature_config = self.feature_config
    return feature_config.compute_rank

581

582

@property
def canonical_parent_order(self):
    """Temporary compatibility proxy for
    ``feature_config.canonical_parent_order``."""
    feature_config = self.feature_config
    return feature_config.canonical_parent_order

586

587

@property
def _lazydelta(self):
    """Temporary compatibility proxy for ``delta_config.lazy_delta``."""
    delta_config = self.delta_config
    return delta_config.lazy_delta

591

592

@property
def _lazydeltabase(self):
    """Temporary compatibility proxy for ``delta_config.lazy_delta_base``."""
    delta_config = self.delta_config
    return delta_config.lazy_delta_base

596

597

def _init_opts(self):
    """Process options (from above/config) to set up the default revlog mode.

    These values might be affected when actually reading on-disk
    information.

    The relevant values are returned, as a 3-tuple, for use in
    _loadindex():

    * newversionflags:
        version header to use if we need to create a new revlog

    * mmapindexthreshold:
        minimal index size to start using mmap (None unless
        ``data_config.mmap_large_index`` is set)

    * force_nodemap:
        force the usage of a "development" version of the nodemap code

    Raises error.RevlogError when the configured chunk cache size is not
    a strictly positive power of 2.
    """
    options = self.opener.options

    # pick the header used when a brand new revlog has to be created
    if b'changelogv2' in options and self.revlog_kind == KIND_CHANGELOG:
        new_header = CHANGELOGV2
        self.feature_config.compute_rank = options.get(
            b'changelogv2.compute-rank', True
        )
    elif b'revlogv2' in options:
        new_header = REVLOGV2
    elif b'revlogv1' in options:
        new_header = REVLOGV1 | FLAG_INLINE_DATA
        if b'generaldelta' in options:
            new_header |= FLAG_GENERALDELTA
    elif b'revlogv0' in self.opener.options:
        new_header = REVLOGV0
    else:
        new_header = REVLOG_DEFAULT_VERSION

    if self.data_config.mmap_large_index:
        mmapindexthreshold = self.data_config.mmap_index_threshold
    else:
        mmapindexthreshold = None

    if self.feature_config.enable_ellipsis:
        self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

    # revlog v0 doesn't have flag processors
    extra_processors = options.get(b'flagprocessors', {})
    for flag, processor in extra_processors.items():
        flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

    cache_size = self.data_config.chunk_cache_size
    if cache_size <= 0:
        raise error.RevlogError(
            _(b'revlog chunk cache size %r is not greater than 0')
            % cache_size
        )
    if cache_size & (cache_size - 1):
        # a power of 2 has a single bit set, so `x & (x - 1)` must be 0
        raise error.RevlogError(
            _(b'revlog chunk cache size %r is not a power of 2')
            % cache_size
        )

    force_nodemap = options.get(b'devel-force-nodemap', False)
    return new_header, mmapindexthreshold, force_nodemap

653

654

def _get_data(self, filepath, mmap_threshold, size=None):
    """Return the content of a file, with or without mmap.

    The file is mmap-ed when `mmap_threshold` is not None and the file is
    at least that large; otherwise it is read normally. When `size` is
    given, at most that many bytes are returned.

    If the file is missing, return the empty bytes string.
    """
    try:
        with self.opener(filepath) as fp:
            use_mmap = False
            if mmap_threshold is not None:
                file_size = self.opener.fstat(fp).st_size
                use_mmap = file_size >= mmap_threshold

            if use_mmap:
                # TODO: should .close() to release resources without
                # relying on Python GC
                if size is None:
                    return util.buffer(util.mmapread(fp))
                # avoid potential mmap crash: never map past the end of
                # the file
                return util.buffer(util.mmapread(fp, min(file_size, size)))

            if size is None:
                return fp.read()
            return fp.read(size)
    except FileNotFoundError:
        return b''

678

679

def get_streams(self, max_linkrev, force_inline=False):
    """Return a list of streams that represent this revlog.

    This is used by stream-clone to do bytes to bytes copies of a
    repository.

    Trailing revisions whose linkrev is not below `max_linkrev` are left
    out of the streamed data.

    If `force_inline` is set, it enforces that the stream will represent
    an inline revlog.

    It returns a list of three-tuples:

        [
            (filename, bytes_stream, stream_size),
            …
        ]

    The list is empty when there is no revision to send.
    """
    rev_count = len(self)
    index = self.index
    while rev_count > 0:
        if index[rev_count - 1][4] < max_linkrev:
            break
        # note: this loop will rarely go through multiple iterations, since
        # it only traverses commits created during the current streaming
        # pull operation.
        #
        # If this become a problem, using a binary search should cap the
        # runtime of this.
        rev_count -= 1
    if rev_count == 0:
        # no data to send
        return []
    index_size = rev_count * index.entry_size
    data_size = self.end(rev_count - 1)

    # XXX we might have been split (or stripped) since the object
    # initialization, We need to close this race too, but having a way to
    # pre-open the file we feed to the revlog and never closing them before
    # we are done streaming.

    def file_stream(open_fp, size):
        # Yield None once the file is open, then the first `size` bytes.
        with open_fp() as fp:
            yield None
            if size <= 65536:
                yield fp.read(size)
            else:
                yield from util.filechunkiter(fp, limit=size)

    def rebuilt_inline_stream():
        # Interleave index entries and data segments of a split revlog so
        # the result reads as an inline revlog.
        with self.reading():
            yield None

            for rev in range(rev_count):
                idx = self.index.entry_binary(rev)
                if rev == 0 and self._docket is None:
                    # re-inject the inline flag
                    header = (
                        self._format_flags
                        | self._format_version
                        | FLAG_INLINE_DATA
                    )
                    idx = self.index.pack_header(header) + idx
                yield idx
                yield self._getsegmentforrevs(rev, rev)[1]

    def primed(stream):
        # Advance to the initial `yield None` so the context manager of
        # the generator is entered before we return.
        next(stream)
        return stream

    if self._inline:
        total_size = index_size + data_size
        inline_stream = primed(file_stream(self._indexfp, total_size))
        return [
            (self._indexfile, inline_stream, total_size),
        ]

    if force_inline:
        inline_stream = primed(rebuilt_inline_stream())
        return [
            (self._indexfile, inline_stream, index_size + data_size),
        ]

    # keep the original opening order: index first, then data
    index_stream = primed(file_stream(self._indexfp, index_size))
    data_stream = primed(file_stream(self._datafp, data_size))
    return [
        (self._datafile, data_stream, data_size),
        (self._indexfile, index_stream, index_size),
    ]

785

786

def _loadindex(self, docket=None):
    """Load the index (and docket, if any) and set up derived state.

    The entry point file is selected from `postfix`, the pending file and
    the split index file. Unless `docket` is provided, the header found in
    the entry point (or the default header from `_init_opts()` when the
    entry point is empty or missing) determines the format version and
    flags.

    Raises error.RevlogError on unknown version/flags, on truncated index
    data, or when the index cannot be parsed.
    """
    new_header, mmapindexthreshold, force_nodemap = self._init_opts()

    # select the file holding the revlog header
    if self.postfix is not None:
        entry_point = b'%s.i.%s' % (self.radix, self.postfix)
    elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
        entry_point = b'%s.i.a' % self.radix
    elif self._try_split and self.opener.exists(self._split_index_file):
        entry_point = self._split_index_file
    else:
        entry_point = b'%s.i' % self.radix

    if docket is not None:
        self._docket = docket
        self._docket_file = entry_point
    else:
        self._initempty = True
        entry_data = self._get_data(entry_point, mmapindexthreshold)
        if len(entry_data) > 0:
            header = INDEX_HEADER.unpack(entry_data[:4])[0]
            self._initempty = False
        else:
            header = new_header

        # low 16 bits carry the version, the rest carries the flags
        self._format_flags = header & ~0xFFFF
        self._format_version = header & 0xFFFF

        supported_flags = SUPPORTED_FLAGS.get(self._format_version)
        if supported_flags is None:
            msg = _(b'unknown version (%d) in revlog %s')
            msg %= (self._format_version, self.display_id)
            raise error.RevlogError(msg)
        elif self._format_flags & ~supported_flags:
            msg = _(b'unknown flags (%#04x) in version %d revlog %s')
            display_flag = self._format_flags >> 16
            msg %= (display_flag, self._format_version, self.display_id)
            raise error.RevlogError(msg)

        features = FEATURES_BY_VERSION[self._format_version]
        self._inline = features[b'inline'](self._format_flags)
        self.delta_config.general_delta = features[b'generaldelta'](
            self._format_flags
        )
        self.feature_config.has_side_data = features[b'sidedata']

        if not features[b'docket']:
            self._indexfile = entry_point
            index_data = entry_data
        else:
            self._docket_file = entry_point
            if self._initempty:
                self._docket = docketutil.default_docket(self, header)
            else:
                self._docket = docketutil.parse_docket(
                    self, entry_data, use_pending=self._trypending
                )

    if self._docket is not None:
        # with a docket, the index lives in a separate file whose valid
        # size is recorded in the docket
        self._indexfile = self._docket.index_filepath()
        index_data = b''
        index_size = self._docket.index_end
        if index_size > 0:
            index_data = self._get_data(
                self._indexfile, mmapindexthreshold, size=index_size
            )
            if len(index_data) < index_size:
                msg = _(b'too few index data for %s: got %d, expected %d')
                msg %= (self.display_id, len(index_data), index_size)
                raise error.RevlogError(msg)

        self._inline = False
        # generaldelta implied by version 2 revlogs.
        self.delta_config.general_delta = True
        # the logic for persistent nodemap will be dealt with within the
        # main docket, so disable it for now.
        self._nodemap_file = None

    if self._docket is not None:
        self._datafile = self._docket.data_filepath()
        self._sidedatafile = self._docket.sidedata_filepath()
    elif self.postfix is None:
        self._datafile = b'%s.d' % self.radix
    else:
        self._datafile = b'%s.d.%s' % (self.radix, self.postfix)

    self.nodeconstants = sha1nodeconstants
    self.nullid = self.nodeconstants.nullid

    # sparse-revlog can't be on without general-delta (issue6056)
    if not self.delta_config.general_delta:
        self.delta_config.sparse_revlog = False

    self._storedeltachains = True

    devel_nodemap = (
        self._nodemap_file
        and force_nodemap
        and parse_index_v1_nodemap is not None
    )

    if rustrevlog is None:
        use_rust_index = False
    elif self._nodemap_file is not None:
        use_rust_index = True
    else:
        use_rust_index = self.opener.options.get(b'rust.index')

    # select the index parser; the format version takes precedence over
    # the nodemap/rust variants of the v1 parser
    if self._format_version == REVLOGV0:
        index_parser = revlogv0.parse_index_v0
    elif self._format_version == REVLOGV2:
        index_parser = parse_index_v2
    elif self._format_version == CHANGELOGV2:
        index_parser = parse_index_cl_v2
    elif devel_nodemap:
        index_parser = parse_index_v1_nodemap
    elif use_rust_index:
        index_parser = parse_index_v1_mixed
    else:
        index_parser = parse_index_v1
    self._parse_index = index_parser

    try:
        parsed = self._parse_index(index_data, self._inline)
        index, chunkcache = parsed
        use_nodemap = (
            not self._inline
            and self._nodemap_file is not None
            and hasattr(index, 'update_nodemap_data')
        )
        if use_nodemap:
            nodemap_data = nodemaputil.persisted_data(self)
            if nodemap_data is not None:
                docket = nodemap_data[0]
                if (
                    len(parsed[0]) > docket.tip_rev
                    and parsed[0][docket.tip_rev][7] == docket.tip_node
                ):
                    # no changelog tampering
                    self._nodemap_docket = docket
                    index.update_nodemap_data(*nodemap_data)
    except (ValueError, IndexError):
        raise error.RevlogError(
            _(b"index %s is corrupted") % self.display_id
        )

    self.index = index
    # revision data is read from the index file for inline revlogs and
    # from the data file otherwise
    segment_path = self._indexfile if self._inline else self._datafile
    self._segmentfile = randomaccessfile.randomaccessfile(
        self.opener,
        segment_path,
        self._chunkcachesize,
        chunkcache,
    )
    self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
        self.opener,
        self._sidedatafile,
        self._chunkcachesize,
    )
    # revnum -> (chain-length, sum-delta-length)
    self._chaininfocache = util.lrucachedict(500)
    # revlog header -> revlog compressor
    self._decompressors = {}

944

945

def get_revlog(self):
    """Return this object itself.

    Simple function to mirror the API of other not-really-revlog objects.
    """
    revlog_obj = self
    return revlog_obj

948

949

@util.propertycache
def revlog_kind(self):
    """The kind of this revlog: first item of ``self.target``."""
    target = self.target
    return target[0]

952

953

@util.propertycache
def display_id(self):
    """The public facing "ID" of the revlog that we use in messages."""
    if self.revlog_kind != KIND_FILELOG:
        return self.radix
    # Reference the file without the "data/" prefix, so it is familiar
    # to the user.
    return self.target[1]

962

963

def _get_decompressor(self, t):
    """Return the compressor object registered for revlog header `t`.

    Results are cached in ``self._decompressors``. Raises
    error.RevlogError when no compression engine is known for `t`.
    """
    try:
        return self._decompressors[t]
    except KeyError:
        # not cached yet: look the engine up below
        pass

    try:
        engine = util.compengines.forrevlogheader(t)
        compressor = engine.revlogcompressor(self._compengineopts)
        self._decompressors[t] = compressor
    except KeyError:
        raise error.RevlogError(
            _(b'unknown compression type %s') % binascii.hexlify(t)
        )
    return compressor

976

977

@util.propertycache
def _compressor(self):
    """Compressor built from the configured compression engine."""
    return util.compengines[self._compengine].revlogcompressor(
        self._compengineopts
    )

981

982

@util.propertycache
def _decompressor(self):
    """The default decompressor (None when there is no docket)."""
    docket = self._docket
    if docket is None:
        return None
    header = docket.default_compression_header
    return self._get_decompressor(header).decompress

990

991

def _indexfp(self):
    """Open the revlog's index file for reading and return the file object."""
    index_path = self._indexfile
    return self.opener(index_path, mode=b"r")

994

995

def __index_write_fp(self):
    """Open the index file for writing, positioned where writes go.

    The existing file is opened in "r+" mode and seeked to its end, or to
    the docket's ``index_end`` when a docket is in use. If the file does
    not exist it is created with "w+" mode instead.
    """
    # You should not use this directly and use `_writing` instead
    try:
        fp = self.opener(
            self._indexfile,
            mode=b"r+",
            checkambig=self.data_config.check_ambig,
        )
        docket = self._docket
        if docket is None:
            offset, whence = 0, os.SEEK_END
        else:
            offset, whence = docket.index_end, os.SEEK_SET
        fp.seek(offset, whence)
        return fp
    except FileNotFoundError:
        return self.opener(
            self._indexfile,
            mode=b"w+",
            checkambig=self.data_config.check_ambig,
        )

1014

1015

def __index_new_fp(self):
    """Open a fresh index file for writing via an atomic temporary file.

    You should not use this unless you are upgrading from inline revlog.
    """
    return self.opener(
        self._indexfile,
        mode=b"w",
        checkambig=self.data_config.check_ambig,
        atomictemp=True,
    )

1023

1024

def _datafp(self, mode=b'r'):
    """file object for the revlog's data file

    ``mode`` is forwarded unchanged to ``self.opener``.
    """
    return self.opener(self._datafile, mode=mode)

1027

1028

@contextlib.contextmanager
def _sidedatareadfp(self):
    """file object suitable to read sidedata

    While writing handles are set, the handle stored at index 2 of
    ``self._writinghandles`` is yielded and left open. Otherwise the
    sidedata file is opened for the duration of the ``with`` block and
    closed on exit.
    """
    if self._writinghandles:
        yield self._writinghandles[2]
    else:
        with self.opener(self._sidedatafile) as fp:
            yield fp

1036

1037

def tiprev(self):
    """Return the highest revision number, i.e. ``len(self.index) - 1``.

    For an empty index this is ``-1``.
    """
    return len(self.index) - 1

1039

1040

def tip(self):
    """Return the node of the tip revision (see ``tiprev``)."""
    return self.node(self.tiprev())

1042

1043

def __contains__(self, rev):
    """Return True when ``rev`` is a revision number in ``[0, len(self))``."""
    return 0 <= rev < len(self)

1045

1046

def __len__(self):
    """Return the number of entries in the index."""
    return len(self.index)

1048

1049

def __iter__(self):
    """Iterate over revision numbers ``0 .. len(self) - 1`` in order."""
    return iter(range(len(self)))

1051

1052

def revs(self, start=0, stop=None):
    """iterate over all rev in this revlog (from start to stop)

    Delegates to ``storageutil.iterrevs`` with the current length of the
    revlog.
    """
    return storageutil.iterrevs(len(self), start=start, stop=stop)

1055

1056

def hasnode(self, node):
    """Return True if ``self.rev(node)`` succeeds, False on ``KeyError``.

    Any other exception raised by the lookup propagates to the caller.
    """
    try:
        self.rev(node)
    except KeyError:
        return False
    return True

1062

1063

def _candelta(self, baserev, rev):
    """whether two revisions (baserev, rev) can be delta-ed or not"""
    # Disable delta if either rev requires a content-changing flag
    # processor (ex. LFS). This is because such flag processor can alter
    # the rawtext content that the delta will be based on, and two clients
    # could have a same revlog node with different flags (i.e. different
    # rawtext contents) and the delta could be incompatible.
    if (self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS) or (
        self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS
    ):
        return False
    return True

1075

1076

def update_caches(self, transaction):
    """update on disk cache

    If a transaction is passed, the update may be delayed to transaction
    commit.

    Nothing happens when the revlog has no persistent nodemap file.
    """
    if self._nodemap_file is None:
        return
    if transaction is None:
        nodemaputil.update_persistent_nodemap(self)
    else:
        nodemaputil.setup_persistent_nodemap(transaction, self)

1086

1087

def clearcaches(self):
    """Clear in-memory caches

    Resets the revision cache, chain-base cache, both segment-file
    caches, the ``_pcache`` dict, the nodemap docket and the index's own
    caches, then reloads persisted nodemap data when it is usable.
    """
    self._revisioncache = None
    self._chainbasecache.clear()
    self._segmentfile.clear_cache()
    self._segmentfile_sidedata.clear_cache()
    self._pcache = {}
    self._nodemap_docket = None
    self.index.clearcaches()
    # The python code is the one responsible for validating the docket, we
    # end up having to refresh it here.
    use_nodemap = (
        not self._inline
        and self._nodemap_file is not None
        and hasattr(self.index, 'update_nodemap_data')
    )
    if use_nodemap:
        nodemap_data = nodemaputil.persisted_data(self)
        if nodemap_data is not None:
            self._nodemap_docket = nodemap_data[0]
            self.index.update_nodemap_data(*nodemap_data)

1108

1109

def rev(self, node):
    """return the revision number associated with a <nodeid>

    ``TypeError`` from the index lookup is propagated untouched. When the
    lookup fails with ``error.RevlogError``, ``error.WdirUnsupported`` is
    raised for working-directory pseudo nodes and ``error.LookupError``
    for any other node.
    """
    try:
        return self.index.rev(node)
    except TypeError:
        raise
    except error.RevlogError:
        # parsers.c radix tree lookup failed
        if (
            node == self.nodeconstants.wdirid
            or node in self.nodeconstants.wdirfilenodeids
        ):
            raise error.WdirUnsupported
        raise error.LookupError(node, self.display_id, _(b'no node'))

1123

1124

# Accessors for index entries.

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
# are flags.

1128

def start(self, rev):
    """Return the offset of ``rev``: index field 0 with its low 16 bits
    (the flags) shifted away."""
    return int(self.index[rev][0] >> 16)

1130

1131

def sidedata_cut_off(self, rev):
    """Return the sidedata offset to use for ``rev``.

    If the entry records a non-zero sidedata offset (index field 8), that
    value is returned. Otherwise the index is walked backwards from
    ``rev`` to the closest entry with a non-zero sidedata size (field 9)
    and the end of that entry's sidedata is returned, or 0 when there is
    no such entry.
    """
    sd_cut_off = self.index[rev][8]
    if sd_cut_off != 0:
        return sd_cut_off
    # This is some annoying dance, because entries without sidedata
    # currently use 0 as their offset. (instead of previous-offset +
    # previous-size)
    #
    # We should reconsider this sidedata → 0 sidedata_offset policy.
    # In the meantime, we need this.
    while 0 <= rev:
        entry = self.index[rev]
        if entry[9] != 0:
            return entry[8] + entry[9]
        rev -= 1
    return 0

1147

1148

def flags(self, rev):
    """Return the flags of ``rev``: the low 16 bits of index field 0."""
    return self.index[rev][0] & 0xFFFF

1150

1151

def length(self, rev):
    """Return index field 1 of ``rev`` (the length that ``end`` adds to
    ``start``)."""
    return self.index[rev][1]

1153

1154

def sidedata_length(self, rev):
    """Return the sidedata size of ``rev`` (index field 9).

    Always 0 when the revlog does not support sidedata.
    """
    if not self.hassidedata:
        return 0
    return self.index[rev][9]

1158

1159

def rawsize(self, rev):
    """return the length of the uncompressed text for a given revision

    The size stored in the index (field 2) is used when it is
    non-negative; otherwise the raw data is loaded and measured.
    """
    stored = self.index[rev][2]
    if stored >= 0:
        return stored

    return len(self.rawdata(rev))

1167

1168

def size(self, rev):
    """length of non-raw text (processed by a "read" flag processor)"""
    # fast path: if no "read" flag processor could change the content,
    # size is rawsize. note: ELLIPSIS is known to not change the content.
    flags = self.flags(rev)
    if flags & (flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
        return self.rawsize(rev)

    # slow path: materialize the processed text and measure it
    return len(self.revision(rev))

1177

1178

def fast_rank(self, rev):
    """Return the rank of a revision if already known, or None otherwise.

    The rank of a revision is the size of the sub-graph it defines as a
    head. Equivalently, the rank of a revision `r` is the size of the set
    `ancestors(r)`, `r` included.

    This method returns the rank retrieved from the revlog in constant
    time. It makes no attempt at computing unknown values for versions of
    the revlog which do not persist the rank.
    """
    rank = self.index[rev][ENTRY_RANK]
    if self._format_version != CHANGELOGV2 or rank == RANK_UNKNOWN:
        return None
    if rev == nullrev:
        return 0  # convention
    return rank

1195

1196

def chainbase(self, rev):
    """Return the base revision of the chain ``rev`` belongs to.

    Index field 3 is followed from entry to entry until an entry refers
    to itself. The result is memoized in ``self._chainbasecache``.
    """
    base = self._chainbasecache.get(rev)
    if base is not None:
        return base

    index = self.index
    iterrev = rev
    base = index[iterrev][3]
    while base != iterrev:
        iterrev = base
        base = index[iterrev][3]

    self._chainbasecache[rev] = base
    return base

1210

1211

def linkrev(self, rev):
    """Return the linkrev stored for ``rev`` (index field 4)."""
    return self.index[rev][4]

1213

1214

def parentrevs(self, rev):
    """Return the two parent revision numbers of ``rev``.

    With ``canonical_parent_order`` enabled, a null first parent is moved
    to the second position. An ``IndexError`` for the working-directory
    revision is turned into ``error.WdirUnsupported``; any other
    ``IndexError`` propagates.
    """
    try:
        entry = self.index[rev]
    except IndexError:
        if rev == wdirrev:
            raise error.WdirUnsupported
        raise

    if self.canonical_parent_order and entry[5] == nullrev:
        return entry[6], entry[5]
    else:
        return entry[5], entry[6]

# fast parentrevs(rev) where rev isn't filtered
_uncheckedparentrevs = parentrevs

1229

1230

def node(self, rev):
    """Return the node stored for ``rev`` (index field 7).

    An ``IndexError`` for the working-directory revision is turned into
    ``error.WdirUnsupported``; any other ``IndexError`` propagates.
    """
    try:
        return self.index[rev][7]
    except IndexError:
        if rev == wdirrev:
            raise error.WdirUnsupported
        raise

1237

1238

# Derived from index values.

1238

# Derived from index values.

1239

1240

def end(self, rev):
    """Return the end offset of ``rev``: ``start(rev) + length(rev)``."""
    return self.start(rev) + self.length(rev)

1242

1243

def parents(self, node):
    """Return the two parent nodes of ``node``.

    With ``canonical_parent_order`` enabled, a null first parent is moved
    to the second position, matching ``parentrevs``.
    """
    i = self.index
    d = i[self.rev(node)]
    # inline node() to avoid function call overhead
    #
    # d[5] is a revision number (it is used as an index just below), so it
    # has to be compared against nullrev; comparing it with the nullid
    # node could never match.
    if self.canonical_parent_order and d[5] == nullrev:
        return i[d[6]][7], i[d[5]][7]
    else:
        return i[d[5]][7], i[d[6]][7]

1251

1252

def chainlen(self, rev):
    """Return the delta chain length of ``rev`` (first item of
    ``_chaininfo``)."""
    return self._chaininfo(rev)[0]

1254

1255

def _chaininfo(self, rev):
    """Return ``(chain length, compressed delta length)`` for ``rev``.

    The chain is walked from ``rev`` towards its base: through index
    field 3 with general delta, through the previous revision otherwise.
    Field 1 of every visited entry is summed. The walk stops early on a
    cached revision, whose totals are reused. Results are memoized in
    ``self._chaininfocache``.
    """
    chaininfocache = self._chaininfocache
    if rev in chaininfocache:
        return chaininfocache[rev]
    index = self.index
    generaldelta = self.delta_config.general_delta
    iterrev = rev
    e = index[iterrev]
    clen = 0
    compresseddeltalen = 0
    while iterrev != e[3]:
        clen += 1
        compresseddeltalen += e[1]
        if generaldelta:
            iterrev = e[3]
        else:
            iterrev -= 1
        if iterrev in chaininfocache:
            t = chaininfocache[iterrev]
            clen += t[0]
            compresseddeltalen += t[1]
            break
        e = index[iterrev]
    else:
        # Add text length of base since decompressing that also takes
        # work. For cache hits the length is already included.
        compresseddeltalen += e[1]
    r = (clen, compresseddeltalen)
    chaininfocache[rev] = r
    return r

1285

1286

def _deltachain(self, rev, stoprev=None):
    """Obtain the delta chain for a revision.

    ``stoprev`` specifies a revision to stop at. If not specified, we
    stop at the base of the chain.

    Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
    revs in ascending order and ``stopped`` is a bool indicating whether
    ``stoprev`` was hit.
    """
    generaldelta = self.delta_config.general_delta
    # Try C implementation.
    try:
        return self.index.deltachain(rev, stoprev, generaldelta)
    except AttributeError:
        pass

    chain = []

    # Alias to prevent attribute lookup in tight loop.
    index = self.index

    iterrev = rev
    e = index[iterrev]
    while iterrev != e[3] and iterrev != stoprev:
        chain.append(iterrev)
        if generaldelta:
            iterrev = e[3]
        else:
            iterrev -= 1
        e = index[iterrev]

    if iterrev == stoprev:
        stopped = True
    else:
        # the chain base itself is part of the chain
        chain.append(iterrev)
        stopped = False

    chain.reverse()
    return chain, stopped

1326

1327

def ancestors(self, revs, stoprev=0, inclusive=False):
    """Generate the ancestors of 'revs' in reverse revision order.
    Does not generate revs lower than stoprev.

    See the documentation for ancestor.lazyancestors for more details."""

    # first, make sure start revisions aren't filtered
    revs = list(revs)
    checkrev = self.node
    for r in revs:
        checkrev(r)
    # and we're sure ancestors aren't filtered as well

    if rustancestor is not None and self.index.rust_ext_compat:
        lazyancestors = rustancestor.LazyAncestors
        arg = self.index
    else:
        lazyancestors = ancestor.lazyancestors
        arg = self._uncheckedparentrevs
    return lazyancestors(arg, revs, stoprev=stoprev, inclusive=inclusive)

1347

1348

def descendants(self, revs):
    """Return the descendants of ``revs`` as computed by
    ``dagop.descendantrevs`` from this revlog's ``revs`` and
    ``parentrevs`` methods."""
    return dagop.descendantrevs(revs, self.revs, self.parentrevs)

1350

1351

def findcommonmissing(self, common=None, heads=None):
    """Return a tuple of the ancestors of common and the ancestors of heads
    that are not ancestors of common. In revset terminology, we return the
    tuple:

      ::common, (::heads) - (::common)

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullid."""
    if common is None:
        common = [self.nullid]
    if heads is None:
        heads = self.heads()

    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    # we want the ancestors, but inclusive
    class lazyset:
        """Set-like view over a lazy collection plus explicitly added values."""

        def __init__(self, lazyvalues):
            self.addedvalues = set()
            self.lazyvalues = lazyvalues

        def __contains__(self, value):
            return value in self.addedvalues or value in self.lazyvalues

        def __iter__(self):
            added = self.addedvalues
            for r in added:
                yield r
            for r in self.lazyvalues:
                if r not in added:
                    yield r

        def add(self, value):
            self.addedvalues.add(value)

        def update(self, values):
            self.addedvalues.update(values)

    has = lazyset(self.ancestors(common))
    has.add(nullrev)
    has.update(common)

    # take all ancestors from heads that aren't in has
    missing = set()
    visit = collections.deque(r for r in heads if r not in has)
    while visit:
        r = visit.popleft()
        if r in missing:
            continue
        else:
            missing.add(r)
            for p in self.parentrevs(r):
                if p not in has:
                    visit.append(p)
    missing = list(missing)
    missing.sort()
    return has, [self.node(miss) for miss in missing]

1414

1415

def incrementalmissingrevs(self, common=None):
    """Return an object that can be used to incrementally compute the
    revision numbers of the ancestors of arbitrary sets that are not
    ancestors of common. This is an ancestor.incrementalmissingancestors
    object.

    'common' is a list of revision numbers. If common is not supplied, uses
    nullrev.
    """
    if common is None:
        common = [nullrev]

    # prefer the Rust implementation when the index supports it
    if rustancestor is not None and self.index.rust_ext_compat:
        return rustancestor.MissingAncestors(self.index, common)
    return ancestor.incrementalmissingancestors(self.parentrevs, common)

1430

1431

def findmissingrevs(self, common=None, heads=None):
    """Return the revision numbers of the ancestors of heads that
    are not ancestors of common.

    More specifically, return a list of revision numbers corresponding to
    nodes N such that every N satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of revision numbers.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullrev."""
    if common is None:
        common = [nullrev]
    if heads is None:
        heads = self.headrevs()

    inc = self.incrementalmissingrevs(common=common)
    return inc.missingancestors(heads)

1454

1455

def findmissing(self, common=None, heads=None):
    """Return the ancestors of heads that are not ancestors of common.

    More specifically, return a list of nodes N such that every N
    satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullid."""
    if common is None:
        common = [self.nullid]
    if heads is None:
        heads = self.heads()

    # work on revision numbers, convert back to nodes on the way out
    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    inc = self.incrementalmissingrevs(common=common)
    return [self.node(r) for r in inc.missingancestors(heads)]

1480

1481

def nodesbetween(self, roots=None, heads=None):
    """Return a topological path from 'roots' to 'heads'.

    Return a tuple (nodes, outroots, outheads) where 'nodes' is a
    topologically sorted list of all nodes N that satisfy both of
    these constraints:

      1. N is a descendant of some node in 'roots'
      2. N is an ancestor of some node in 'heads'

    Every node is considered to be both a descendant and an ancestor
    of itself, so every reachable node in 'roots' and 'heads' will be
    included in 'nodes'.

    'outroots' is the list of reachable nodes in 'roots', i.e., the
    subset of 'roots' that is returned in 'nodes'.  Likewise,
    'outheads' is the subset of 'heads' that is also in 'nodes'.

    'roots' and 'heads' are both lists of node IDs.  If 'roots' is
    unspecified, uses nullid as the only root.  If 'heads' is
    unspecified, uses list of all of the revlog's heads.

    When nothing qualifies (an empty 'roots' or 'heads' was passed, no
    ancestor could be tagged, or no root is an ancestor of the heads),
    the triple of empty lists ``([], [], [])`` is returned."""
    # Shared "nothing found" result returned by every early exit below.
    nonodes = ([], [], [])
    if roots is not None:
        roots = list(roots)
        if not roots:
            return nonodes
        lowestrev = min([self.rev(n) for n in roots])
    else:
        roots = [self.nullid]  # Everybody's a descendant of nullid
        lowestrev = nullrev
    if (lowestrev == nullrev) and (heads is None):
        # We want _all_ the nodes!
        return (
            [self.node(r) for r in self],
            [self.nullid],
            list(self.heads()),
        )
    if heads is None:
        # All nodes are ancestors, so the latest ancestor is the last
        # node.
        highestrev = len(self) - 1
        # Set ancestors to None to signal that every node is an ancestor.
        ancestors = None
        # Set heads to an empty dictionary for later discovery of heads
        heads = {}
    else:
        heads = list(heads)
        if not heads:
            return nonodes
        ancestors = set()
        # Turn heads into a dictionary so we can remove 'fake' heads.
        # Also, later we will be using it to filter out the heads we can't
        # find from roots.  The value is True once the head was reached.
        heads = dict.fromkeys(heads, False)
        # Start at the top and keep marking parents until we're done.
        nodestotag = set(heads)
        # Remember where the top was so we can use it as a limit later.
        highestrev = max([self.rev(n) for n in nodestotag])
        while nodestotag:
            # grab a node to tag
            n = nodestotag.pop()
            # Never tag nullid
            if n == self.nullid:
                continue
            # A node's revision number represents its place in a
            # topologically sorted list of nodes.
            r = self.rev(n)
            if r >= lowestrev:
                if n not in ancestors:
                    # If we are possibly a descendant of one of the roots
                    # and we haven't already been marked as an ancestor
                    ancestors.add(n)  # Mark as ancestor
                    # Add non-nullid parents to list of nodes to tag.
                    nodestotag.update(
                        [p for p in self.parents(n) if p != self.nullid]
                    )
                elif n in heads:  # We've seen it before, is it a fake head?
                    # So it is, real heads should not be the ancestors of
                    # any other heads.
                    heads.pop(n)
        if not ancestors:
            return nonodes
        # Now that we have our set of ancestors, we want to remove any
        # roots that are not ancestors.

        # If one of the roots was nullid, everything is included anyway.
        if lowestrev > nullrev:
            # But, since we weren't, let's recompute the lowest rev to not
            # include roots that aren't ancestors.

            # Filter out roots that aren't ancestors of heads
            roots = [root for root in roots if root in ancestors]
            # Recompute the lowest revision
            if roots:
                lowestrev = min([self.rev(root) for root in roots])
            else:
                # No more roots?  Return empty list
                return nonodes
        else:
            # We are descending from nullid, and don't need to care about
            # any other roots.
            lowestrev = nullrev
            roots = [self.nullid]
    # Transform our roots list into a set.
    descendants = set(roots)
    # Also, keep the original roots so we can filter out roots that aren't
    # 'real' roots (i.e. are descended from other roots).
    roots = descendants.copy()
    # Our topologically sorted list of output nodes.
    orderedout = []
    # Don't start at nullid since we don't want nullid in our output list,
    # and if nullid shows up in descendants, empty parents will look like
    # they're descendants.
    for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
        n = self.node(r)
        isdescendant = False
        if lowestrev == nullrev:  # Everybody is a descendant of nullid
            isdescendant = True
        elif n in descendants:
            # n is already a descendant
            isdescendant = True
            # This check only needs to be done here because all the roots
            # were marked as descendants before the loop started.
            if n in roots:
                # If n was a root, check if it's a 'real' root.
                p = tuple(self.parents(n))
                # If any of its parents are descendants, it's not a root.
                if (p[0] in descendants) or (p[1] in descendants):
                    roots.remove(n)
        else:
            p = tuple(self.parents(n))
            # A node is a descendant if either of its parents are
            # descendants.  (We seeded the descendants set with the roots
            # up there, remember?)
            if (p[0] in descendants) or (p[1] in descendants):
                descendants.add(n)
                isdescendant = True
        if isdescendant and ((ancestors is None) or (n in ancestors)):
            # Only include nodes that are both descendants and ancestors.
            orderedout.append(n)
            if (ancestors is not None) and (n in heads):
                # We're trying to figure out which heads are reachable
                # from roots.
                # Mark this head as having been reached
                heads[n] = True
            elif ancestors is None:
                # Otherwise, we're trying to discover the heads.
                # Assume this is a head because if it isn't, the next step
                # will eventually remove it.
                heads[n] = True
                # But, obviously its parents aren't.
                for p in self.parents(n):
                    heads.pop(p, None)
    # Keep only the heads that were actually reached / discovered.
    heads = [head for head, flag in heads.items() if flag]
    roots = list(roots)
    # NOTE(review): these asserts encode the expectation that reaching this
    # point implies a non-empty result -- confirm no caller relies on them
    # for validation, since asserts are stripped under ``python -O``.
    assert orderedout
    assert roots
    assert heads
    return (orderedout, roots, heads)

1640

1641

def headrevs(self, revs=None):
    """Return head revision numbers, for the whole revlog or for ``revs``.

    With ``revs`` left as None the index's own ``headrevs()`` is used,
    falling back to ``self._headrevs()`` when that raises AttributeError.
    Otherwise the heads of the ``revs`` subset are computed, through the
    Rust helper when it is available and the index is compatible with it,
    and through ``dagop.headrevs`` if not.
    """
    if revs is not None:
        if rustdagop is not None and self.index.rust_ext_compat:
            return rustdagop.headrevs(self.index, revs)
        return dagop.headrevs(revs, self._uncheckedparentrevs)

    try:
        return self.index.headrevs()
    except AttributeError:
        # The index offers no head computation; use the generic one.
        return self._headrevs()

1650

1651

def computephases(self, roots):
    """Forward ``roots`` to the index's ``computephasesmapsets`` and
    return whatever it produces."""
    index = self.index
    return index.computephasesmapsets(roots)

1653

1654

def _headrevs(self):
    """Compute head revisions by walking every revision of the revlog.

    Returns ``[nullrev]`` for an empty revlog; otherwise the ascending
    list of revisions that no iterated revision names as a parent.
    """
    total = len(self)
    if total == 0:
        return [nullrev]
    # One extra trailing slot so that a parent of -1 (which indexes the
    # last element) can be written without disturbing a real revision.
    # We won't iterate over filtered revs, so nobody is a head at start.
    flags = [0] * (total + 1)
    entries = self.index
    for rev in self:
        flags[rev] = 1  # candidate head until a child shows up
        entry = entries[rev]
        # Slots 5 and 6 of an index entry are read as the two parents.
        for parent in (entry[5], entry[6]):
            flags[parent] = 0
    return [rev for rev, marked in enumerate(flags) if marked]

1666

1667

def heads(self, start=None, stop=None):
    """return the list of all nodes that have no children

    if start is specified, only heads that are descendants of
    start will be returned
    if stop is specified, it will consider all the revs from stop
    as if they had no children
    """
    if start is None and stop is None:
        # Unrestricted query: answer straight from headrevs().
        if len(self) == 0:
            return [self.nullid]
        return [self.node(headrev) for headrev in self.headrevs()]

    startrev = nullrev if start is None else self.rev(start)

    stoprevs = set()
    for stopnode in stop or ():
        stoprevs.add(self.rev(stopnode))

    subset = dagop.headrevssubset(
        self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
    )
    return [self.node(headrev) for headrev in subset]

1692

1693

def children(self, node):
    """find the children of a given node"""
    parentrev = self.rev(node)
    found = []
    # Children always have a higher revision number than their parent.
    for rev in self.revs(start=parentrev + 1):
        realparents = [pr for pr in self.parentrevs(rev) if pr != nullrev]
        if not realparents:
            # A parentless revision counts as a child of the null revision.
            if parentrev == nullrev:
                found.append(self.node(rev))
            continue
        for pr in realparents:
            if pr == parentrev:
                found.append(self.node(rev))
    return found

1706

1707

def commonancestorsheads(self, a, b):
    """calculate all the heads of the common ancestors of nodes a and b"""
    reva = self.rev(a)
    revb = self.rev(b)
    headrevs = self._commonancestorsheads(reva, revb)
    # Translate the revision numbers back into nodes.
    return pycompat.maplist(self.node, headrevs)

1712

1713

def _commonancestorsheads(self, *revs):
    """calculate all the heads of the common ancestors of revs"""
    try:
        return self.index.commonancestorsheads(*revs)
    except (AttributeError, OverflowError):
        # The index implementation is missing or failed; use the
        # generic implementation from the ancestor module.
        return ancestor.commonancestorsheads(self.parentrevs, *revs)

1720

1721

def isancestor(self, a, b):
    """return True if node a is an ancestor of node b

    A revision is considered an ancestor of itself."""
    reva = self.rev(a)
    revb = self.rev(b)
    return self.isancestorrev(reva, revb)

1727

1728

def isancestorrev(self, a, b):
    """return True if revision a is an ancestor of revision b

    A revision is considered an ancestor of itself.

    The implementation of this is trivial but the use of
    reachableroots is not."""
    # The null revision and the revision itself are always ancestors.
    if a == nullrev or a == b:
        return True
    # A higher-numbered revision is never reported as an ancestor.
    if a > b:
        return False
    reached = self.reachableroots(a, [b], [a], includepath=False)
    return bool(reached)

1742

1743

def reachableroots(self, minroot, heads, roots, includepath=False):
    """return (heads(::(<roots> and <roots>::<heads>)))

    If includepath is True, return (<roots>::<heads>)."""
    try:
        result = self.index.reachableroots2(
            minroot, heads, roots, includepath
        )
    except AttributeError:
        # No index-level implementation; note the pure helper takes
        # roots before heads.
        result = dagop._reachablerootspure(
            self.parentrevs, minroot, roots, heads, includepath
        )
    return result

1755

1756

def ancestor(self, a, b):
    """calculate the "best" common ancestor of nodes a and b"""

    reva, revb = self.rev(a), self.rev(b)
    try:
        candidates = self.index.ancestors(reva, revb)
    except (AttributeError, OverflowError):
        candidates = ancestor.ancestors(self.parentrevs, reva, revb)
    if not candidates:
        return self.nullid
    # choose a consistent winner when there's a tie
    return min(map(self.node, candidates))

1768

1769

def _match(self, id):
    """Resolve ``id`` to a node when it identifies a revision exactly.

    ``id`` is tried, in order, as: an integer revision number, a binary
    node of ``nodeconstants.nodelen`` bytes, the decimal text of a
    revision number (negative values count from the end), and a full
    hex node of twice ``nodelen`` characters.

    Returns the matching node, or None (implicitly) when none of the
    interpretations matches.
    """
    if isinstance(id, int):
        # rev
        return self.node(id)
    if len(id) == self.nodeconstants.nodelen:
        # possibly a binary node
        # odds of a binary node being all hex in ASCII are 1 in 10**25
        try:
            node = id
            self.rev(node)  # quick search the index
            return node
        except error.LookupError:
            pass  # may be partial hex id
    try:
        # str(rev)
        rev = int(id)
        # Reject spellings that do not round-trip exactly through "%d".
        if b"%d" % rev != id:
            raise ValueError
        if rev < 0:
            rev = len(self) + rev
        if rev < 0 or rev >= len(self):
            raise ValueError
        return self.node(rev)
    except (ValueError, OverflowError):
        # Not a usable revision number; try the remaining forms.
        pass
    if len(id) == 2 * self.nodeconstants.nodelen:
        try:
            # a full hex nodeid?
            node = bin(id)
            self.rev(node)
            return node
        except (binascii.Error, error.LookupError):
            pass

1802

1803

def _partialmatch(self, id):
    """Resolve a hex prefix ``id`` to the single node it identifies.

    The index's ``partialmatch`` is tried first; when it is unavailable
    or inconclusive, the index entries are scanned for matching nodes.

    Returns the matching node, or None when nothing matches.

    Raises ``error.AmbiguousPrefixLookupError`` when the prefix matches
    more than one candidate (including the wdir pseudo-node), and
    ``error.WdirUnsupported`` when the prefix only matches the wdir hex
    id.
    """
    # we don't care wdirfilenodeids as they should be always full hash
    maybewdir = self.nodeconstants.wdirhex.startswith(id)
    ambiguous = False
    try:
        partial = self.index.partialmatch(id)
        if partial and self.hasnode(partial):
            if maybewdir:
                # single 'ff...' match in radix tree, ambiguous with wdir
                ambiguous = True
            else:
                return partial
        elif maybewdir:
            # no 'ff...' match in radix tree, wdir identified
            raise error.WdirUnsupported
        else:
            return None
    except error.RevlogError:
        # parsers.c radix tree lookup gave multiple matches
        # fast path: for unfiltered changelog, radix tree is accurate
        if not getattr(self, 'filteredrevs', None):
            ambiguous = True
        # fall through to slow path that filters hidden revisions
    except (AttributeError, ValueError):
        # we are pure python, or key is not hex
        pass
    if ambiguous:
        raise error.AmbiguousPrefixLookupError(
            id, self.display_id, _(b'ambiguous identifier')
        )

    # Reuse the result of an earlier slow-path lookup for this prefix.
    if id in self._pcache:
        return self._pcache[id]

    # NOTE(review): 40 looks like the hex length of a 20-byte node;
    # confirm whether this should follow ``self.nodeconstants.nodelen``.
    if len(id) <= 40:
        # hex(node)[:...]
        l = len(id) // 2 * 2  # grab an even number of digits
        try:
            # we're dropping the last digit, so let's check that it's hex,
            # to avoid the expensive computation below if it's not
            if len(id) % 2 > 0:
                if not (id[-1] in hexdigits):
                    return None
            prefix = bin(id[:l])
        except binascii.Error:
            pass
        else:
            # Slot 7 of an index entry is read as the node: first filter
            # on the binary prefix, then on the full (possibly odd-length)
            # hex prefix.
            nl = [e[7] for e in self.index if e[7].startswith(prefix)]
            nl = [
                n for n in nl if hex(n).startswith(id) and self.hasnode(n)
            ]
            if self.nodeconstants.nullhex.startswith(id):
                nl.append(self.nullid)
            if len(nl) > 0:
                if len(nl) == 1 and not maybewdir:
                    self._pcache[id] = nl[0]
                    return nl[0]
                raise error.AmbiguousPrefixLookupError(
                    id, self.display_id, _(b'ambiguous identifier')
                )
            if maybewdir:
                raise error.WdirUnsupported
            return None

1866

1867

def lookup(self, id):
    """locate a node based on:
    - revision number or str(revision number)
    - nodeid or subset of hex nodeid

    Raises error.LookupError when neither an exact nor a partial match
    is found.
    """
    exact = self._match(id)
    if exact is not None:
        return exact

    partial = self._partialmatch(id)
    if not partial:
        raise error.LookupError(id, self.display_id, _(b'no match found'))
    return partial

1880

1881

def shortest(self, node, minlength=1):
    """Find the shortest unambiguous prefix that matches node.

    ``minlength`` is the smallest prefix length that will be tried.  The
    returned prefix is a slice of ``hex(node)``.

    Raises ``error.LookupError`` when ``node`` cannot be found.
    """

    def isvalid(prefix):
        # True when ``prefix`` resolves unambiguously via _partialmatch.
        try:
            matchednode = self._partialmatch(prefix)
        except error.AmbiguousPrefixLookupError:
            return False
        except error.WdirUnsupported:
            # single 'ff...' match
            return True
        if matchednode is None:
            raise error.LookupError(node, self.display_id, _(b'no node'))
        return True

    def maybewdir(prefix):
        # A prefix made only of 'f' characters could also denote wdir.
        return all(c == b'f' for c in pycompat.iterbytestr(prefix))

    hexnode = hex(node)

    def disambiguate(hexnode, minlength):
        """Disambiguate against wdirid."""
        # Lengthen the prefix until it is no longer all 'f'.
        for length in range(minlength, len(hexnode) + 1):
            prefix = hexnode[:length]
            if not maybewdir(prefix):
                return prefix

    # Fast path: only taken when no revisions are filtered.
    if not getattr(self, 'filteredrevs', None):
        try:
            length = max(self.index.shortest(node), minlength)
            return disambiguate(hexnode, length)
        except error.RevlogError:
            if node != self.nodeconstants.wdirid:
                raise error.LookupError(
                    node, self.display_id, _(b'no node')
                )
        except AttributeError:
            # Fall through to pure code
            pass

    if node == self.nodeconstants.wdirid:
        # wdir itself: the first valid prefix is returned as-is, without
        # disambiguating against wdir.
        for length in range(minlength, len(hexnode) + 1):
            prefix = hexnode[:length]
            if isvalid(prefix):
                return prefix

    for length in range(minlength, len(hexnode) + 1):
        prefix = hexnode[:length]
        if isvalid(prefix):
            return disambiguate(hexnode, length)

1931

1932

def cmp(self, node, text):
    """compare text with a given file revision

    returns True if text is different than what is stored.
    """
    parent1, parent2 = self.parents(node)
    # Hashing ``text`` with the stored parents must reproduce ``node``
    # for the content to be considered unchanged.
    computed = storageutil.hashrevisionsha1(text, parent1, parent2)
    return computed != node

1939

1940

def _getsegmentforrevs(self, startrev, endrev):
    """Read the raw bytes covering revisions ``startrev`` to ``endrev``.

    The read itself is delegated to ``self._segmentfile.read_chunk`` and
    may be satisfied by a cache.

    Returns a 2-tuple ``(offset, data)``. ``offset`` is the integer
    position at which the segment starts and ``data`` is whatever
    ``read_chunk`` returned for that range (raw, still compressed bytes).

    Callers will need ``self.start(rev)`` and ``self.length(rev)`` to find
    where each individual revision begins and ends inside ``data``.
    """
    # ``self.start(startrev)`` and ``self.end(endrev)`` are deliberately
    # open-coded here: this is a hot path and function calls are expensive.
    index = self.index
    first_entry = index[startrev]
    # the data offset lives above the low 16 bits of the first index field
    start = int(first_entry[0] >> 16)
    if startrev != endrev:
        last_entry = index[endrev]
        end = int(last_entry[0] >> 16) + last_entry[1]
    else:
        end = start + first_entry[1]

    if self._inline:
        # inline revlogs interleave index entries with the data, so every
        # entry up to and including the revision shifts the position
        start += (startrev + 1) * self.index.entry_size
        end += (endrev + 1) * self.index.entry_size

    return start, self._segmentfile.read_chunk(start, end - start)

1973

1974

def _chunk(self, rev):
    """Return the decompressed chunk stored for revision ``rev``.

    The compression mode recorded in the index entry (field 10) selects
    how the raw segment is turned into the returned data:

    - ``COMP_MODE_PLAIN``: the segment is returned untouched,
    - ``COMP_MODE_DEFAULT``: ``self._decompressor`` is applied,
    - ``COMP_MODE_INLINE``: ``self.decompress`` is applied.

    Raises ``error.RevlogError`` for any other compression mode.
    """
    mode = self.index[rev][10]
    segment = self._getsegmentforrevs(rev, rev)[1]
    if mode == COMP_MODE_PLAIN:
        return segment
    if mode == COMP_MODE_DEFAULT:
        return self._decompressor(segment)
    if mode == COMP_MODE_INLINE:
        return self.decompress(segment)
    raise error.RevlogError(b'unknown compression mode %d' % mode)

1995

1996

def _chunks(self, revs, targetsize=None):
    """Obtain decompressed chunks for the specified revisions.

    ``revs`` is a sequence of numeric revisions assumed to be in
    ascending order. When sparse reading is enabled
    (``self._withsparseread``), the revisions are split into several
    slices by ``deltautil.slicechunk`` and ``targetsize`` is forwarded to
    it; otherwise everything is read as a single segment.

    This function is similar to calling ``self._chunk()`` for each
    revision, but reads the underlying data in larger segments.

    Returns a list with the decompressed data of each requested
    revision, in the order of ``revs``.

    Raises ``error.RevlogError`` if an index entry carries an unknown
    compression mode.
    """
    if not revs:
        return []
    start = self.start
    length = self.length
    inline = self._inline
    iosize = self.index.entry_size
    buffer = util.buffer

    l = []
    ladd = l.append

    if not self._withsparseread:
        slicedchunks = (revs,)
    else:
        slicedchunks = deltautil.slicechunk(
            self, revs, targetsize=targetsize
        )

    decomp = self.decompress
    # self._decompressor might be None, but will not be used in that case
    def_decomp = self._decompressor

    for revschunk in slicedchunks:
        firstrev = revschunk[0]
        # Skip trailing revisions with empty diff
        for lastrev in revschunk[::-1]:
            if length(lastrev) != 0:
                break

        try:
            offset, data = self._getsegmentforrevs(firstrev, lastrev)
        except OverflowError:
            # issue4215 - we can't cache a run of chunks greater than
            # 2G on Windows
            #
            # Fall back to one read per revision for this slice only.
            # Results gathered from earlier slices are kept and later
            # slices are still processed, so the returned list always
            # covers every requested revision.
            for rev in revschunk:
                ladd(self._chunk(rev))
            continue

        for rev in revschunk:
            chunkstart = start(rev)
            if inline:
                # account for the index entries interleaved with the data
                chunkstart += (rev + 1) * iosize
            chunklength = length(rev)
            comp_mode = self.index[rev][10]
            # view on the revision's bytes inside the larger segment
            c = buffer(data, chunkstart - offset, chunklength)
            if comp_mode == COMP_MODE_PLAIN:
                ladd(c)
            elif comp_mode == COMP_MODE_INLINE:
                ladd(decomp(c))
            elif comp_mode == COMP_MODE_DEFAULT:
                ladd(def_decomp(c))
            else:
                msg = b'unknown compression mode %d'
                msg %= comp_mode
                raise error.RevlogError(msg)

    return l

2063

2064

def deltaparent(self, rev):
    """Return the revision ``rev`` is stored as a delta against.

    The delta base recorded in the index entry (field 3) drives the
    answer:

    - ``nullrev`` when the entry is its own base,
    - the recorded base when ``self.delta_config.general_delta`` is set,
    - ``rev - 1`` otherwise.
    """
    base = self.index[rev][3]
    if base == rev:
        return nullrev
    if self.delta_config.general_delta:
        return base
    return rev - 1

2073

2074

def issnapshot(self, rev):
    """Tell whether ``rev`` is a snapshot.

    Without ``self._sparserevlog`` a revision is a snapshot exactly when
    it has no delta parent. With it, the index's own ``issnapshot`` is
    used when available; otherwise a revision is a snapshot when it is
    ``nullrev``, when its delta base is itself or ``nullrev``, or when its
    base is neither of its (empty-delta-skipped) parents and is itself a
    snapshot.
    """
    if not self._sparserevlog:
        return self.deltaparent(rev) == nullrev
    if hasattr(self.index, 'issnapshot'):
        # shadow this method on the instance so that later calls skip the
        # tests above and go straight to the index implementation
        self.issnapshot = self.index.issnapshot
        return self.issnapshot(rev)
    if rev == nullrev:
        return True

    entry = self.index[rev]
    base = entry[3]
    if base == rev or base == nullrev:
        return True

    def skip_empty(parent):
        # walk down the delta parents for as long as the stored length is
        # zero, stopping if the walk no longer makes progress
        while self.length(parent) == 0:
            below = self.deltaparent(parent)
            if below == parent:
                break
            parent = below
        return parent

    p1 = skip_empty(entry[5])
    p2 = skip_empty(entry[6])
    if base == p1 or base == p2:
        # a delta against a parent is a regular delta, not a snapshot
        return False
    return self.issnapshot(base)

2105

2106

def snapshotdepth(self, rev):
    """Return the number of snapshots in the chain before ``rev``.

    This is the length of the delta chain of ``rev`` minus one.

    Raises ``error.ProgrammingError`` if ``rev`` is not a snapshot.
    """
    if not self.issnapshot(rev):
        # interpolate the revision: the message used to be emitted with a
        # literal, unformatted ``%d``
        raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
    return len(self._deltachain(rev)[0]) - 1

2111

2112

def revdiff(self, rev1, rev2):
    """Return a binary delta going from ``rev1`` to ``rev2``.

    The delta is meant to be written to revlog data directly, so it is
    built from raw revision data.

    When ``rev2`` is already stored as a delta against ``rev1`` (and
    ``rev1`` is not ``nullrev``), the stored chunk is returned as
    ``bytes``. Otherwise the delta is computed from the raw data of both
    revisions.
    """
    stored_against_rev1 = (
        rev1 != nullrev and self.deltaparent(rev2) == rev1
    )
    if not stored_against_rev1:
        old_raw = self.rawdata(rev1)
        new_raw = self.rawdata(rev2)
        return mdiff.textdiff(old_raw, new_raw)
    return bytes(self._chunk(rev2))

2122

2123

def revision(self, nodeorrev):
    """Return the uncompressed revision for a node or revision number.

    This is ``self._revisiondata`` called with its default (non-raw)
    mode.
    """
    text = self._revisiondata(nodeorrev)
    return text

2128

2129

def sidedata(self, nodeorrev):
    """Return the sidedata map of a node or revision number.

    Sidedata is extra data related to the changeset that is not part of
    the hash.

    The result is whatever ``self._sidedata`` returns, currently a
    dictionary; a more advanced (lazier) mapping object may replace it in
    the future.
    """
    # an ``int`` is already a revision number, anything else is a node
    rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
    return self._sidedata(rev)

2142

2143

def _revisiondata(self, nodeorrev, raw=False):
    """Return the text of a revision given as a node or revision number.

    With ``raw=True`` the text as stored in the revlog is returned (flag
    processors are only consulted for hash validation); otherwise the
    text is run through the read-side flag processors first.

    The text is hash-checked when the flag processing asks for it, and a
    rawtext that did not come from the revision cache is stored in
    ``self._revisioncache`` before returning.
    """
    # deal with <nodeorrev> argument type
    if isinstance(nodeorrev, int):
        rev = nodeorrev
        node = self.node(rev)
    else:
        rev = None
        node = nodeorrev

    # fast path the special `nullid` rev
    if node == self.nullid:
        return b""

    # ``rawtext`` is the text as stored inside the revlog. Might be the
    # revision or might need to be processed to retrieve the revision.
    rev, rawtext, validated = self._rawtext(node, rev)

    if raw and validated:
        # the raw text is wanted as-is and it came out of the cache
        # already validated: nothing left to do
        return rawtext

    if rev is None:
        rev = self.rev(node)
    # the revlog's flag for this revision
    # (usually alter its state or content)
    flags = self.flags(rev)

    if validated and flags == REVIDX_DEFAULT_FLAGS:
        # no extra flags set, no flag processor runs, text = rawtext
        return rawtext

    if raw:
        needs_check = flagutil.processflagsraw(self, rawtext, flags)
        text = rawtext
    else:
        text, needs_check = flagutil.processflagsread(self, rawtext, flags)

    if needs_check:
        self.checkhash(text, node, rev=rev)
    if not validated:
        # ``_rawtext`` dropped the cache; refill it now that the text has
        # gone through validation
        self._revisioncache = (node, rev, rawtext)

    return text

2186

2187

def _rawtext(self, node, rev):
    """Return the possibly unvalidated rawtext for a revision.

    ``rev`` may be None, in which case it is resolved from ``node`` when
    the text has to be rebuilt.

    Returns ``(rev, rawtext, validated)``. ``validated`` is True only when
    the text came straight out of ``self._revisioncache``; in that case
    ``rev`` is returned exactly as it was passed in. Otherwise the text is
    rebuilt from the delta chain, the revision cache is dropped, and the
    caller is expected to refill it after validating the text.
    """
    # revision in the cache (could be useful to apply delta)
    cachedrev = None
    # An intermediate text to apply deltas to
    basetext = None

    # The cache entry looks like (node, rev, rawtext)
    cached = self._revisioncache
    if cached:
        if cached[0] == node:
            return (rev, cached[2], True)
        cachedrev = cached[1]

    if rev is None:
        rev = self.rev(node)

    chain, stopped = self._deltachain(rev, stoprev=cachedrev)
    if stopped:
        # the chain walk ended on the cached revision: start from its text
        basetext = self._revisioncache[2]

    # drop cache to save memory, the caller is expected to
    # update self._revisioncache after validating the text
    self._revisioncache = None

    rawsize = self.index[rev][2]
    targetsize = 4 * rawsize if 0 <= rawsize else None

    bins = self._chunks(chain, targetsize=targetsize)
    if basetext is None:
        # no cached starting point: the first chunk is the base text and
        # the remaining ones are the deltas to apply on top of it
        basetext = bytes(bins[0])
        bins = bins[1:]

    rawtext = mdiff.patches(basetext, bins)
    del basetext  # let us have a chance to free memory early
    return (rev, rawtext, False)

2229

2230

def _sidedata(self, rev):
    """Return the sidedata for a given revision number.

    The location and size of the sidedata are read from the index entry
    (fields 8 and 9) and its compression mode from field 11. An empty
    dict is returned when the recorded size is zero.

    Raises ``error.RevlogError`` if the requested range ends past
    ``self._docket.sidedata_end`` or if the compression mode is unknown.
    """
    entry = self.index[rev]
    offset = entry[8]
    size = entry[9]

    if self._inline:
        offset += self.index.entry_size * (1 + rev)
    if size == 0:
        return {}

    sidedata_end = self._docket.sidedata_end
    if sidedata_end < offset + size:
        # the index points past the end of the known sidedata
        details = (self._sidedatafile, size, offset, sidedata_end)
        raise error.RevlogError(FILE_TOO_SHORT_MSG % details)

    stored = self._segmentfile_sidedata.read_chunk(offset, size)

    mode = self.index[rev][11]
    if mode == COMP_MODE_PLAIN:
        segment = stored
    elif mode == COMP_MODE_DEFAULT:
        segment = self._decompressor(stored)
    elif mode == COMP_MODE_INLINE:
        segment = self.decompress(stored)
    else:
        raise error.RevlogError(b'unknown compression mode %d' % mode)

    return sidedatautil.deserialize_sidedata(segment)

2267

2268

def rawdata(self, nodeorrev):
    """Return the uncompressed raw data for a node or revision number.

    This is ``self._revisiondata`` called in raw mode.
    """
    raw_text = self._revisiondata(nodeorrev, raw=True)
    return raw_text

2271

2272

def hash(self, text, p1, p2):
    """Compute the node hash of ``text`` with parents ``p1`` and ``p2``.

    Kept as a method so that subclasses can substitute another hash as
    needed.
    """
    node = storageutil.hashrevisionsha1(text, p1, p2)
    return node

2279

2280

def checkhash(self, text, node, p1=None, p2=None, rev=None):
    """Check that ``text`` hashes to ``node``.

    When neither ``p1`` nor ``p2`` is given, the parents are looked up
    from ``node``. ``rev`` is only used to identify the revision in the
    error message; a short hex form of ``node`` is used when it is None.

    Kept as a method so that subclasses can extend hash mismatch
    behaviors as needed.

    Raises ``error.RevlogError`` on a hash mismatch, or
    ``error.CensoredNodeError`` instead when the revlog is censorable and
    ``text`` is a censored text.
    """
    try:
        if p1 is None and p2 is None:
            p1, p2 = self.parents(node)
        if node != self.hash(text, p1, p2):
            # Clear the revision cache on hash failure. The revision cache
            # only stores the raw revision and clearing the cache does have
            # the side-effect that we won't have a cache hit when the raw
            # revision data is accessed. But this case should be rare and
            # it is extra work to teach the cache about the hash
            # verification state.
            cached = self._revisioncache
            if cached and cached[0] == node:
                self._revisioncache = None

            if rev is None:
                revornode = templatefilters.short(hex(node))
            else:
                revornode = rev
            message = _(b"integrity check failed on %s:%s") % (
                self.display_id,
                pycompat.bytestr(revornode),
            )
            raise error.RevlogError(message)
    except error.RevlogError:
        # any revlog error raised above is reported as a censored node
        # when that is what the text turns out to be
        censorable = self.feature_config.censorable
        if censorable and storageutil.iscensoredtext(text):
            raise error.CensoredNodeError(self.display_id, node, text)
        raise

2310

2312

2311

@property
def _split_index_file(self):
    """Path where the index of an ongoing splitting operation is expected.

    The file will only exist while a splitting operation is in progress,
    but it is always expected at the same location.
    """
    parts = self.radix.split(b'/')
    if len(parts) <= 1:
        # the revlog is stored at the root of the store (changelog or
        # manifest), no risk of collision.
        return self.radix + b'.i.s'

    # append '-s' to the leading `data` or `meta` directory and '.i' to
    # the final component; the directories in between are kept as they are
    renamed = [parts[0] + b'-s', *parts[1:-1], parts[-1] + b'.i']
    return b'/'.join(renamed)

2329

2331

2330

def _enforceinlinesize(self, tr, side_write=True):

2332

def _enforceinlinesize(self, tr, side_write=True):

2331

"""Check if the revlog is too big for inline and convert if so.

2333

"""Check if the revlog is too big for inline and convert if so.

2332

2334

2333

This should be called after revisions are added to the revlog. If the

2335

This should be called after revisions are added to the revlog. If the

2334

revlog has grown too large to be an inline revlog, it will convert it

2336

revlog has grown too large to be an inline revlog, it will convert it

2335

to use multiple index and data files.

2337

to use multiple index and data files.

2336

"""

2338

"""

2337

tiprev = len(self) - 1

2339

tiprev = len(self) - 1

2338

total_size = self.start(tiprev) + self.length(tiprev)

2340

total_size = self.start(tiprev) + self.length(tiprev)

2339

if not self._inline or total_size < _maxinline:

2341

if not self._inline or total_size < _maxinline:

2340

return

2342

return

2341

2343

2342

troffset = tr.findoffset(self._indexfile)

2344

troffset = tr.findoffset(self._indexfile)

2343

if troffset is None:

2345

if troffset is None:

2344

raise error.RevlogError(

2346

raise error.RevlogError(

2345

_(b"%s not found in the transaction") % self._indexfile

2347

_(b"%s not found in the transaction") % self._indexfile

2346

)

2348

)

2347

if troffset:

2349

if troffset:

2348

tr.addbackup(self._indexfile, for_offset=True)

2350

tr.addbackup(self._indexfile, for_offset=True)

2349

tr.add(self._datafile, 0)

2351

tr.add(self._datafile, 0)

2350

2352

2351

existing_handles = False

2353

existing_handles = False

2352

if self._writinghandles is not None:

2354

if self._writinghandles is not None:

2353

existing_handles = True

2355

existing_handles = True

2354

fp = self._writinghandles[0]

2356

fp = self._writinghandles[0]

2355

fp.flush()

2357

fp.flush()

2356

fp.close()

2358

fp.close()

2357

# We can't use the cached file handle after close(). So prevent

2359

# We can't use the cached file handle after close(). So prevent

2358

# its usage.

2360

# its usage.

2359

self._writinghandles = None

2361

self._writinghandles = None

2360

self._segmentfile.writing_handle = None

2362

self._segmentfile.writing_handle = None

2361

# No need to deal with sidedata writing handle as it is only

2363

# No need to deal with sidedata writing handle as it is only

2362

# relevant with revlog-v2 which is never inline, not reaching

2364

# relevant with revlog-v2 which is never inline, not reaching

2363

# this code

2365

# this code

2364

if side_write:

2366

if side_write:

2365

old_index_file_path = self._indexfile

2367

old_index_file_path = self._indexfile

2366

new_index_file_path = self._split_index_file

2368

new_index_file_path = self._split_index_file

2367

opener = self.opener

2369

opener = self.opener

2368

weak_self = weakref.ref(self)

2370

weak_self = weakref.ref(self)

2369

2371

2370

# the "split" index replace the real index when the transaction is finalized

2372

# the "split" index replace the real index when the transaction is finalized

2371

def finalize_callback(tr):

2373

def finalize_callback(tr):

2372

opener.rename(

2374

opener.rename(

2373

new_index_file_path,

2375

new_index_file_path,

2374

old_index_file_path,

2376

old_index_file_path,

2375

checkambig=True,

2377

checkambig=True,

2376

)

2378

)

2377

maybe_self = weak_self()

2379

maybe_self = weak_self()

2378

if maybe_self is not None:

2380

if maybe_self is not None:

2379

maybe_self._indexfile = old_index_file_path

2381

maybe_self._indexfile = old_index_file_path

2380

2382

2381

def abort_callback(tr):

2383

def abort_callback(tr):

2382

maybe_self = weak_self()

2384

maybe_self = weak_self()

2383

if maybe_self is not None:

2385

if maybe_self is not None:

2384

maybe_self._indexfile = old_index_file_path

2386

maybe_self._indexfile = old_index_file_path

2385

2387

2386

tr.registertmp(new_index_file_path)

2388

tr.registertmp(new_index_file_path)

2387

if self.target[1] is not None:

2389

if self.target[1] is not None:

2388

callback_id = b'000-revlog-split-%d-%s' % self.target

2390

callback_id = b'000-revlog-split-%d-%s' % self.target

2389

else:

2391

else:

2390

callback_id = b'000-revlog-split-%d' % self.target[0]

2392

callback_id = b'000-revlog-split-%d' % self.target[0]

2391

tr.addfinalize(callback_id, finalize_callback)

2393

tr.addfinalize(callback_id, finalize_callback)

2392

tr.addabort(callback_id, abort_callback)

2394

tr.addabort(callback_id, abort_callback)

2393

2395

2394

new_dfh = self._datafp(b'w+')

2396

new_dfh = self._datafp(b'w+')

2395

new_dfh.truncate(0) # drop any potentially existing data

2397

new_dfh.truncate(0) # drop any potentially existing data

2396

try:

2398

try:

2397

with self.reading():

2399

with self.reading():

2398

for r in self:

2400

for r in self:

2399

new_dfh.write(self._getsegmentforrevs(r, r)[1])

2401

new_dfh.write(self._getsegmentforrevs(r, r)[1])

2400

new_dfh.flush()

2402

new_dfh.flush()

2401

2403

2402

if side_write:

2404

if side_write:

2403

self._indexfile = new_index_file_path

2405

self._indexfile = new_index_file_path

2404

with self.__index_new_fp() as fp:

2406

with self.__index_new_fp() as fp:

2405

self._format_flags &= ~FLAG_INLINE_DATA

2407

self._format_flags &= ~FLAG_INLINE_DATA

2406

self._inline = False

2408

self._inline = False

2407

for i in self:

2409

for i in self:

2408

e = self.index.entry_binary(i)

2410

e = self.index.entry_binary(i)

2409

if i == 0 and self._docket is None:

2411

if i == 0 and self._docket is None:

2410

header = self._format_flags | self._format_version

2412

header = self._format_flags | self._format_version

2411

header = self.index.pack_header(header)

2413

header = self.index.pack_header(header)

2412

e = header + e

2414

e = header + e

2413

fp.write(e)

2415

fp.write(e)

2414

if self._docket is not None:

2416

if self._docket is not None:

2415

self._docket.index_end = fp.tell()

2417

self._docket.index_end = fp.tell()

2416

2418

2417

# If we don't use side-write, the temp file replace the real

2419

# If we don't use side-write, the temp file replace the real

2418

# index when we exit the context manager

2420

# index when we exit the context manager

2419

2421

2420

nodemaputil.setup_persistent_nodemap(tr, self)

2422

nodemaputil.setup_persistent_nodemap(tr, self)

2421

self._segmentfile = randomaccessfile.randomaccessfile(

2423

self._segmentfile = randomaccessfile.randomaccessfile(

2422

self.opener,

2424

self.opener,

2423

self._datafile,

2425

self._datafile,

2424

self._chunkcachesize,

2426

self._chunkcachesize,

2425

)

2427

)

2426

2428

2427

if existing_handles:

2429

if existing_handles:

2428

# switched from inline to conventional reopen the index

2430

# switched from inline to conventional reopen the index

2429

ifh = self.__index_write_fp()

2431

ifh = self.__index_write_fp()

2430

self._writinghandles = (ifh, new_dfh, None)

2432

self._writinghandles = (ifh, new_dfh, None)

2431

self._segmentfile.writing_handle = new_dfh

2433

self._segmentfile.writing_handle = new_dfh

2432

new_dfh = None

2434

new_dfh = None

2433

# No need to deal with sidedata writing handle as it is only

2435

# No need to deal with sidedata writing handle as it is only

2434

# relevant with revlog-v2 which is never inline, not reaching

2436

# relevant with revlog-v2 which is never inline, not reaching

2435

# this code

2437

# this code

2436

finally:

2438

finally:

2437

if new_dfh is not None:

2439

if new_dfh is not None:

2438

new_dfh.close()

2440

new_dfh.close()

2439

2441

2440

def _nodeduplicatecallback(self, transaction, node):
    """Hook invoked when an already stored node is added again.

    This implementation does nothing and returns ``None``.
    """
    return None

2442

2444

2443

@contextlib.contextmanager
def reading(self):
    """Keep the data and sidedata files open for reading inside the context.

    When the index holds no entry there is nothing to read, so the body runs
    without any file being opened.
    """
    if len(self.index) != 0:
        # data segment first, sidedata segment second; released in reverse
        with self._segmentfile.reading(), self._segmentfile_sidedata.reading():
            yield
    else:
        yield  # empty revlog: nothing to be read

2452

2454

2453

@contextlib.contextmanager
def _writing(self, transaction):
    """Context manager that opens the revlog files for writing.

    On entry the data file (non-inline revlogs only), the sidedata file
    (when the revlog has one) and the index file are opened, each file is
    registered with ``transaction`` through ``transaction.add`` together
    with its current end offset, and the handles are published through
    ``self._writinghandles`` and the two segment-file helpers.

    When the body completes without raising, the docket (if any) is written.
    In every case the published handles are reset to ``None`` and the files
    are closed on exit.

    The context is re-entrant: if ``self._writinghandles`` is already set,
    the body runs with the existing handles and nothing is opened or closed
    here.

    Raises ``error.ProgrammingError`` when the revlog is in ``trypending``
    mode.
    """
    if self._trypending:
        msg = b'try to write in a `trypending` revlog: %s'
        msg %= self.display_id
        raise error.ProgrammingError(msg)
    if self._writinghandles is not None:
        # an outer `_writing` context already owns the handles
        yield
    else:
        ifh = dfh = sdfh = None
        try:
            r = len(self)
            # opening the data file.
            dsize = 0
            if r:
                dsize = self.end(r - 1)
            if not self._inline:
                try:
                    dfh = self._datafp(b"r+")
                    if self._docket is None:
                        dfh.seek(0, os.SEEK_END)
                    else:
                        dfh.seek(self._docket.data_end, os.SEEK_SET)
                except FileNotFoundError:
                    dfh = self._datafp(b"w+")
                transaction.add(self._datafile, dsize)
            if self._sidedatafile is not None:
                # revlog-v2 does not inline, help Pytype
                assert dfh is not None
                try:
                    sdfh = self.opener(self._sidedatafile, mode=b"r+")
                    # position the *sidedata* handle at the end of the
                    # sidedata (the data handle was positioned above)
                    sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                except FileNotFoundError:
                    sdfh = self.opener(self._sidedatafile, mode=b"w+")
                transaction.add(
                    self._sidedatafile, self._docket.sidedata_end
                )

            # opening the index file.
            isize = r * self.index.entry_size
            ifh = self.__index_write_fp()
            if self._inline:
                # inline revlogs keep the revision data in the index file
                transaction.add(self._indexfile, dsize + isize)
            else:
                transaction.add(self._indexfile, isize)
            # exposing all file handle for writing.
            self._writinghandles = (ifh, dfh, sdfh)
            self._segmentfile.writing_handle = ifh if self._inline else dfh
            self._segmentfile_sidedata.writing_handle = sdfh
            yield
            # only reached when the body did not raise
            if self._docket is not None:
                self._write_docket(transaction)
        finally:
            self._writinghandles = None
            self._segmentfile.writing_handle = None
            self._segmentfile_sidedata.writing_handle = None
            if dfh is not None:
                dfh.close()
            if sdfh is not None:
                sdfh.close()
            # closing the index file last to avoid exposing referent to
            # potential unflushed data content.
            if ifh is not None:
                ifh.close()

2518

2520

2519

def _write_docket(self, transaction):
    """Write the current docket to disk.

    This lives in its own method so that the changelog can implement its
    transaction logic around it.

    The same transaction logic could conceivably be used for every revlog,
    since dockets are cheap.
    """
    docket = self._docket
    docket.write(transaction)

2527

2529

2528

def addrevision(
    self,
    text,
    transaction,
    link,
    p1,
    p2,
    cachedelta=None,
    node=None,
    flags=REVIDX_DEFAULT_FLAGS,
    deltacomputer=None,
    sidedata=None,
):
    """Add a revision to the log and return its revision number.

    text - the revision data to add (run through the write-side flag
        processors before being stored)
    transaction - the transaction object used for rollback
    link - the linkrev data to add; ``nullrev`` is rejected
    p1, p2 - the parent nodeids of the revision
    cachedelta - an optional precomputed delta; dropped when the flag
        processors changed the text
    node - nodeid of the revision; usually left unset and computed as
        hash(text, p1, p2).  Subclasses might hash differently (and
        override checkhash() in that case)
    flags - the known flags to set on the revision
    deltacomputer - an optional deltacomputer instance shared between
        multiple calls
    sidedata - optional sidedata; non-empty sidedata is rejected when the
        revlog does not support it

    When the node is already present in the index, its existing revision
    number is returned and nothing is added.
    """
    if link == nullrev:
        raise error.RevlogError(
            _(b"attempted to add linkrev -1 to %s") % self.display_id
        )

    if sidedata is not None:
        if sidedata and not self.hassidedata:
            raise error.ProgrammingError(
                _(b"trying to add sidedata to a revlog who don't support them")
            )
    else:
        sidedata = {}

    if flags and not node:
        # with flags set, the node is derived from the non-raw text
        node = self.hash(text, p1, p2)

    rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

    if rawtext != text:
        # The flag processor modified the revision data, so any provided
        # cachedelta no longer applies.
        cachedelta = None

    rawsize = len(rawtext)
    if rawsize > _maxentrysize:
        raise error.RevlogError(
            _(
                b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
            )
            % (self.display_id, rawsize)
        )

    if not node:
        node = self.hash(rawtext, p1, p2)

    existing = self.index.get_rev(node)
    if existing is not None:
        return existing

    if validatehash:
        self.checkhash(rawtext, node, p1=p1, p2=p2)

    return self.addrawrevision(
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=cachedelta,
        deltacomputer=deltacomputer,
        sidedata=sidedata,
    )

2605

2607

2606

def addrawrevision(
    self,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    node,
    flags,
    cachedelta=None,
    deltacomputer=None,
    sidedata=None,
):
    """Add a raw revision whose flags, node and parents are already known.

    Useful when reusing a revision that is not stored in this revlog (for
    example one received over the wire, or read from an external bundle).

    The work is delegated to ``_addrevision`` inside a ``_writing`` context
    and its result is returned.
    """
    optional = {'deltacomputer': deltacomputer, 'sidedata': sidedata}
    with self._writing(transaction):
        new_rev = self._addrevision(
            node,
            rawtext,
            transaction,
            link,
            p1,
            p2,
            flags,
            cachedelta,
            **optional
        )
        return new_rev

2636

2638

2637

def compress(self, data):
    """Return a ``(header, payload)`` pair, with the payload possibly compressed.

    The header is ``b'u'`` when ``data`` is returned unchanged and needs an
    explicit marker; otherwise it is ``b''``: empty input, output of the
    compressor (which already carries its own header), or data that starts
    with a NUL byte.
    """
    if data:
        packed = self._compressor.compress(data)
        if packed:
            # The revlog compressor added the header in the returned data.
            return b'', packed
        if data[0:1] != b'\0':
            return b'u', data
    return b'', data

2651

2653

2652

def decompress(self, data):
    """Decompress a revlog chunk.

    The first byte of the chunk is a header identifying the format, which
    selects the decompressor.  Empty input is returned as is.

    Raises ``error.RevlogError`` when zlib fails on a ``b'x'`` chunk.
    """
    if not data:
        return data

    # Revlogs are read far more often than they are written, and many chunks
    # decompress in microseconds, so the dispatch order matters here.
    #
    # Assumptions about revlogs:
    #
    # 1) most chunks are compressed (as opposed to inline raw data);
    # 2) decompressing *any* data is likely at least 10x slower than
    #    returning raw inline data;
    # 3) common and officially supported compression engines should be
    #    prioritized.
    #
    # Hence the inline checks come first and the generic engine lookup
    # last.  According to `hg perfrevlogchunks`, this is ~0.5% faster for
    # zlib compressed chunks, which matters for changelog and manifest
    # reads.
    header = data[0:1]

    if header == b'x':
        try:
            return _zlibdecompress(data)
        except zlib.error as e:
            raise error.RevlogError(
                _(b'revlog decompress error: %s')
                % stringutil.forcebytestr(e)
            )
    # '\0' is more common than 'u' so it goes first.
    if header == b'\0':
        return data
    if header == b'u':
        # skip the one-byte marker without copying
        return util.buffer(data, 1)

    return self._get_decompressor(header).decompress(data)

2701

2703

2702

def _addrevision(
    self,
    node,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    flags,
    cachedelta,
    alwayscache=False,
    deltacomputer=None,
    sidedata=None,
):
    """Internal function appending one revision to the log.

    See addrevision for the argument descriptions.

    Note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

    When "deltacomputer" is not provided (or is None), a default
    deltacomputer is created.

    Invariants:
    - rawtext is optional (can be None); if not set, cachedelta must be set.
      If both are set, they must correspond to each other.

    Must be called inside a `revlog._writing` context.  Returns the new
    revision number.
    """
    if node == self.nullid:
        raise error.RevlogError(
            _(b"%s: attempt to add null revision") % self.display_id
        )
    constants = self.nodeconstants
    if node == constants.wdirid or node in constants.wdirfilenodeids:
        raise error.RevlogError(
            _(b"%s: attempt to add wdir revision") % self.display_id
        )
    if self._writinghandles is None:
        raise error.ProgrammingError(
            b'adding revision outside `revlog._writing` context'
        )

    # One-element list handed to the revision info below and read back once
    # the entry has been written.
    text_holder = [rawtext]

    new_rev = len(self)
    offset = self._get_data_offset(new_rev - 1)

    checker = self._concurrencychecker
    if checker:
        ifh, dfh, sdfh = self._writinghandles
        # XXX no checking for the sidedata file
        index_bytes = new_rev * self.index.entry_size
        if self._inline:
            # offset is "as if" it were in the .d file, so the size of the
            # entry metadata has to be added on top of it.
            checker(ifh, self._indexfile, offset + index_bytes)
        else:
            # Entries in the .i are a consistent size.
            checker(ifh, self._indexfile, index_bytes)
            checker(dfh, self._datafile, offset)

    p1r = self.rev(p1)
    p2r = self.rev(p2)

    # full versions are inserted when the needed deltas
    # become comparable to the uncompressed text
    if rawtext is not None:
        textlen = len(rawtext)
    else:
        # need rawtext size, before changed by flag processors, which is
        # the non-raw size. use revlog explicitly to avoid filelog's extra
        # logic that might remove metadata size.
        base_size = revlog.size(self, cachedelta[0])
        textlen = mdiff.patchedsize(base_size, cachedelta[1])

    if deltacomputer is None:
        write_debug = transaction._report if self._debug_delta else None
        deltacomputer = deltautil.deltacomputer(
            self, write_debug=write_debug
        )

    if cachedelta is not None and len(cachedelta) == 2:
        # The cached delta carries no instruction about how it should be
        # reused: add the default one according to the revlog's
        # configuration.
        delta_cfg = self.delta_config
        if delta_cfg.general_delta and delta_cfg.lazy_delta_base:
            reuse_policy = DELTA_BASE_REUSE_TRY
        else:
            reuse_policy = DELTA_BASE_REUSE_NO
        cachedelta = (cachedelta[0], cachedelta[1], reuse_policy)

    revinfo = revlogutils.revisioninfo(
        node,
        p1,
        p2,
        text_holder,
        textlen,
        cachedelta,
        flags,
    )

    deltainfo = deltacomputer.finddeltainfo(revinfo)

    compression_mode = COMP_MODE_INLINE
    if self._docket is not None:
        compression_mode, deltainfo = deltautil.delta_compression(
            self._docket.default_compression_header, deltainfo
        )

    if sidedata and self.hassidedata:
        sidedata_compression_mode = COMP_MODE_PLAIN
        serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
        sidedata_offset = self._docket.sidedata_end
        comp_header, comp_sidedata = self.compress(serialized_sidedata)
        use_compressed = (
            comp_header != b'u'
            and comp_sidedata[0:1] != b'\0'
            and len(comp_sidedata) < len(serialized_sidedata)
        )
        if use_compressed:
            assert not comp_header
            if (
                comp_sidedata[0:1]
                == self._docket.default_compression_header
            ):
                sidedata_compression_mode = COMP_MODE_DEFAULT
            else:
                sidedata_compression_mode = COMP_MODE_INLINE
            serialized_sidedata = comp_sidedata
    else:
        sidedata_compression_mode = COMP_MODE_INLINE
        serialized_sidedata = b""
        # Don't store the offset if the sidedata is empty, that way
        # we can easily detect empty sidedata and they will be no different
        # than ones we manually add.
        sidedata_offset = 0

    rank = RANK_UNKNOWN
    if self._compute_rank:
        if p2r == nullrev:
            # root (no parent) or single parent on the p1 side
            rank = 1 if p1r == nullrev else 1 + self.fast_rank(p1r)
        elif p1r == nullrev:
            rank = 1 + self.fast_rank(p2r)
        elif rustdagop is not None and self.index.rust_ext_compat:
            # merge node, Rust fast path
            rank = rustdagop.rank(self.index, p1r, p2r)
        else:
            # merge node, pure Python
            pmin, pmax = sorted((p1r, p2r))
            # The loop variable lives in the generator's own scope; it must
            # not become a function local named `_`, which would shadow the
            # translation function used above.
            missing = sum(
                1 for _missing in self.findmissingrevs([pmax], [pmin])
            )
            rank = 1 + self.fast_rank(pmax)
            rank += missing

    index_entry = revlogutils.entry(
        flags=flags,
        data_offset=offset,
        data_compressed_length=deltainfo.deltalen,
        data_uncompressed_length=textlen,
        data_compression_mode=compression_mode,
        data_delta_base=deltainfo.base,
        link_rev=link,
        parent_rev_1=p1r,
        parent_rev_2=p2r,
        node_id=node,
        sidedata_offset=sidedata_offset,
        sidedata_compressed_length=len(serialized_sidedata),
        sidedata_compression_mode=sidedata_compression_mode,
        rank=rank,
    )

    self.index.append(index_entry)
    packed_entry = self.index.entry_binary(new_rev)
    if new_rev == 0 and self._docket is None:
        # without a docket, the first entry is prefixed by the packed header
        header = self.index.pack_header(
            self._format_flags | self._format_version
        )
        packed_entry = header + packed_entry
    self._writeentry(
        transaction,
        packed_entry,
        deltainfo.data,
        link,
        offset,
        serialized_sidedata,
        sidedata_offset,
    )

    rawtext = text_holder[0]

    if alwayscache and rawtext is None:
        rawtext = deltacomputer.buildtext(revinfo)

    if type(rawtext) == bytes:  # only accept immutable objects
        self._revisioncache = (node, new_rev, rawtext)
    self._chainbasecache[new_rev] = deltainfo.chainbase
    return new_rev

2906

2908

2907

def _get_data_offset(self, prev):

2909

def _get_data_offset(self, prev):

2908

"""Returns the current offset in the (in-transaction) data file.

2910

"""Returns the current offset in the (in-transaction) data file.

2909

Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket

2911

Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket

2910

file to store that information: since sidedata can be rewritten to the

2912

file to store that information: since sidedata can be rewritten to the

2911

end of the data file within a transaction, you can have cases where, for

2913

end of the data file within a transaction, you can have cases where, for

2912

example, rev `n` does not have sidedata while rev `n - 1` does, leading

2914

example, rev `n` does not have sidedata while rev `n - 1` does, leading

2913

to `n - 1`'s sidedata being written after `n`'s data.

2915

to `n - 1`'s sidedata being written after `n`'s data.

2914

2916

2915

TODO cache this in a docket file before getting out of experimental."""

2917

TODO cache this in a docket file before getting out of experimental."""

2916

if self._docket is None:

2918

if self._docket is None:

2917

return self.end(prev)

2919

return self.end(prev)

2918

else:

2920

else:

2919

return self._docket.data_end

2921

return self._docket.data_end

2920

2922

2921

def _writeentry(
    self, transaction, entry, data, link, offset, sidedata, sidedata_offset
):
    """Write one packed index entry and its payload through the open handles.

    ``entry`` is the binary index entry, ``data`` is a two-item sequence
    whose first item is only written when truthy (non-inline case),
    ``sidedata`` is the serialized sidedata (may be empty).  ``offset`` and
    ``sidedata_offset`` are registered with ``transaction`` before writing.
    ``link`` is accepted but not used by this method.

    Raises ``error.ProgrammingError`` when no writing handles are open.
    """
    handles = self._writinghandles
    if handles is None:
        msg = b'adding revision outside `revlog._writing` context'
        raise error.ProgrammingError(msg)
    ifh, dfh, sdfh = handles

    # Files opened in a+ mode have inconsistent behavior on various
    # platforms. Windows requires that a file positioning call be made
    # when the file handle transitions between reads and writes. See
    # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
    # platforms, Python or the platform itself can be buggy. Some versions
    # of Solaris have been observed to not append at the end of the file
    # if the file was seeked to before the end. See issue4943 for more.
    #
    # We work around this issue by inserting a seek() before writing.
    # Note: This is likely not necessary on Python 3. However, because
    # the file handle is reused for reads and may be seeked there, we need
    # to be careful before changing this.
    if self._docket is None:
        ifh.seek(0, os.SEEK_END)
        if dfh:
            dfh.seek(0, os.SEEK_END)
    else:
        ifh.seek(self._docket.index_end, os.SEEK_SET)
        if dfh:
            dfh.seek(self._docket.data_end, os.SEEK_SET)
    if sdfh:
        sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)

    curr = len(self) - 1
    if self._inline:
        # inline revlog: entry and data are interleaved in the index file
        offset += curr * self.index.entry_size
        transaction.add(self._indexfile, offset)
        ifh.write(entry)
        ifh.write(data[0])
        ifh.write(data[1])
        assert not sidedata
        self._enforceinlinesize(transaction)
    else:
        transaction.add(self._datafile, offset)
        if self._sidedatafile:
            transaction.add(self._sidedatafile, sidedata_offset)
        transaction.add(self._indexfile, curr * len(entry))
        header_chunk = data[0]
        if header_chunk:
            dfh.write(header_chunk)
        dfh.write(data[1])
        if sidedata:
            sdfh.write(sidedata)
        ifh.write(entry)

    if self._docket is not None:
        # revlog-v2 always has 3 writing handles, help Pytype
        index_handle = self._writinghandles[0]
        data_handle = self._writinghandles[1]
        sidedata_handle = self._writinghandles[2]
        assert index_handle is not None
        assert data_handle is not None
        assert sidedata_handle is not None
        # record the new end of each file in the docket
        self._docket.index_end = index_handle.tell()
        self._docket.data_end = data_handle.tell()
        self._docket.sidedata_end = sidedata_handle.tell()

    nodemaputil.setup_persistent_nodemap(transaction, self)

2985

2987

2986

def addgroup(
    self,
    deltas,
    linkmapper,
    transaction,
    alwayscache=False,
    addrevisioncb=None,
    duplicaterevisioncb=None,
    debug_info=None,
    delta_base_reuse_policy=None,
):
    """Add a group of deltas to the revision log.

    Each item of ``deltas`` is an 8-tuple ``(node, p1, p2, linknode,
    deltabase, delta, flags, sidedata)``.  The first delta is against its
    parent, which should be in our log, the rest are against the previous
    delta.

    If ``addrevisioncb`` is defined, it is called with this revlog and the
    revision number returned for the newly added entry.  If
    ``duplicaterevisioncb`` is defined, it is called with this revlog and
    the revision number of an entry whose node was already stored.

    Returns True if at least one item of ``deltas`` was processed.

    Raises ``error.ProgrammingError`` on nested calls,
    ``error.LookupError`` on unknown parent or delta base, and
    ``error.CensoredBaseError`` when a delta against a censored base is not
    a full replacement.
    """
    if self._adding_group:
        raise error.ProgrammingError(b'cannot nest addgroup() calls')

    # read the default delta-base reuse policy from revlog config if the
    # group did not specify one.
    if delta_base_reuse_policy is None:
        config = self.delta_config
        if config.general_delta and config.lazy_delta_base:
            delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
        else:
            delta_base_reuse_policy = DELTA_BASE_REUSE_NO

    self._adding_group = True
    processed_any = False
    try:
        with self._writing(transaction):
            write_debug = transaction._report if self._debug_delta else None
            deltacomputer = deltautil.deltacomputer(
                self,
                write_debug=write_debug,
                debug_info=debug_info,
            )
            # loop through our set of deltas
            for item in deltas:
                (
                    node,
                    p1,
                    p2,
                    linknode,
                    deltabase,
                    delta,
                    flags,
                    sidedata,
                ) = item
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                known_rev = self.index.get_rev(node)
                if known_rev is not None:
                    # this can happen if two branches make the same change
                    self._nodeduplicatecallback(transaction, known_rev)
                    if duplicaterevisioncb:
                        duplicaterevisioncb(self, known_rev)
                    processed_any = True
                    continue

                for parent in (p1, p2):
                    if not self.index.has_node(parent):
                        raise error.LookupError(
                            parent, self.radix, _(b'unknown parent')
                        )

                if not self.index.has_node(deltabase):
                    raise error.LookupError(
                        deltabase, self.display_id, _(b'unknown delta base')
                    )

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # if base is censored, delta must be full replacement in a
                    # single patch operation
                    header_size = struct.calcsize(b">lll")
                    base_size = self.rawsize(baserev)
                    payload_size = len(delta) - header_size
                    expected_header = mdiff.replacediffheader(
                        base_size, payload_size
                    )
                    if delta[:header_size] != expected_header:
                        raise error.CensoredBaseError(
                            self.display_id, self.node(baserev)
                        )

                if not flags and self._peek_iscensored(baserev, delta):
                    flags |= REVIDX_ISCENSORED

                # We assume consumers of addrevisioncb will want to retrieve
                # the added revision, which will require a call to
                # revision(). revision() will fast path if there is a cache
                # hit. So, we tell _addrevision() to always cache in this case.
                # We're only using addgroup() in the context of changegroup
                # generation so the revision data can always be handled as raw
                # by the flagprocessor.
                new_rev = self._addrevision(
                    node,
                    None,
                    transaction,
                    link,
                    p1,
                    p2,
                    flags,
                    (baserev, delta, delta_base_reuse_policy),
                    alwayscache=alwayscache,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

                if addrevisioncb:
                    addrevisioncb(self, new_rev)
                processed_any = True
    finally:
        self._adding_group = False
    return processed_any

3114

3116

3115

def iscensored(self, rev):
    """Tell whether revision ``rev`` carries the censored flag.

    Always False when the revlog's feature config is not censorable.
    """
    if self.feature_config.censorable:
        return self.flags(rev) & REVIDX_ISCENSORED
    return False

3121

3123

3122

def _peek_iscensored(self, baserev, delta):

3124

def _peek_iscensored(self, baserev, delta):

3123

"""Quickly check if a delta produces a censored revision."""

3125

"""Quickly check if a delta produces a censored revision."""

3124

if not self._censorable:

3126

if not self.feature_config.censorable:

3125

return False

3127

return False

3126

3128

3127

return storageutil.deltaiscensored(delta, baserev, self.rawsize)

3129

return storageutil.deltaiscensored(delta, baserev, self.rawsize)

3128

3130

3129

def getstrippoint(self, minlink):
    """Find the minimum rev that must be stripped to strip the linkrev.

    Returns a tuple containing the minimum rev and a set of all revs that
    have linkrevs that will be broken by this strip.
    """
    resolve = storageutil.resolvestripinfo
    tiprev = len(self) - 1
    heads = self.headrevs()
    return resolve(minlink, tiprev, heads, self.linkrev, self.parentrevs)

3142

3144

3143

def strip(self, minlink, transaction):
    """Truncate the revlog on the first revision with a linkrev >= minlink.

    This function is called when we're stripping revision minlink and
    its descendants from the repository.

    We have to remove all revisions with linkrev >= minlink, because
    the equivalent changelog revisions will be renumbered after the
    strip.

    So we truncate the revlog on the first of these revisions, and
    trust that the caller has saved the revisions that shouldn't be
    removed and that it'll re-add them after this truncation.
    """
    if not len(self):
        return

    rev, _brokenrevs = self.getstrippoint(minlink)
    if rev == len(self):
        # nothing at or above the strip point
        return

    # first truncate the files on disk
    data_end = self.start(rev)
    index_span = rev * self.index.entry_size
    if self._inline:
        # inline revlogs keep the data inside the index file
        end = data_end + index_span
    else:
        transaction.add(self._datafile, data_end)
        end = index_span

    if self._sidedatafile:
        sidedata_end = self.sidedata_cut_off(rev)
        transaction.add(self._sidedatafile, sidedata_end)

    transaction.add(self._indexfile, end)
    docket = self._docket
    if docket is not None:
        # XXX we could leverage the docket while stripping. However it is
        # not powerful enough at the time of this comment
        docket.index_end = end
        docket.data_end = data_end
        docket.sidedata_end = sidedata_end
        docket.write(transaction, stripping=True)

    # then reset internal state in memory to forget those revisions
    self._revisioncache = None
    self._chaininfocache = util.lrucachedict(500)
    self._segmentfile.clear_cache()
    self._segmentfile_sidedata.clear_cache()

    del self.index[rev:-1]

3192

3194

3193

def checksize(self):
    """Check size of index and data files.

    Return a (dd, di) tuple.
    - dd: extra bytes for the "data" file
    - di: extra bytes for the "index" file

    A healthy revlog will return (0, 0).  A missing data or index file
    contributes 0 to the corresponding value.
    """
    expected = 0
    if len(self):
        expected = max(0, self.end(len(self) - 1))

    try:
        with self._datafp() as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        dd = actual - expected
    except FileNotFoundError:
        dd = 0

    try:
        # use a context manager so the handle is released even when
        # seek()/tell() fail, like the data file above
        with self.opener(self._indexfile) as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        s = self.index.entry_size
        i = max(0, actual // s)
        # bytes left over after the last complete index entry
        di = actual - (i * s)
        if self._inline:
            # inline revlogs store revision data in the index file, so the
            # data file has nothing to report and the index must account
            # for both entries and data
            databytes = sum(max(0, self.length(r)) for r in self)
            dd = 0
            di = actual - len(self) * s - databytes
    except FileNotFoundError:
        di = 0

    return (dd, di)

3232

3234

3233

def files(self):
    """Return the list of file paths used by this revlog.

    The index file always comes first.  Without a docket file, the data
    file is added unless the revlog is inline.  With a docket file, the
    docket file, the data/sidedata files (when their recorded end is
    non-zero) and the non-empty older files listed by the docket are added.
    """
    paths = [self._indexfile]
    if self._docket_file is None:
        if not self._inline:
            paths.append(self._datafile)
        return paths

    docket = self._docket
    paths.append(self._docket_file)
    paths.extend(docket.old_index_filepaths(include_empty=False))
    if docket.data_end:
        paths.append(self._datafile)
    paths.extend(docket.old_data_filepaths(include_empty=False))
    if docket.sidedata_end:
        paths.append(self._sidedatafile)
    paths.extend(docket.old_sidedata_filepaths(include_empty=False))
    return paths

3248

3250

3249

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
    sidedata_helpers=None,
    debug_info=None,
):
    """Normalize the arguments and delegate to ``storageutil.emitrevisions``.

    ``nodesorder`` must be ``b'nodes'``, ``b'storage'``, ``b'linear'`` or
    None, otherwise ``error.ProgrammingError`` is raised.  When it is None
    and the revlog is not general-delta, ``b'storage'`` is used.  When
    delta chains are not stored and ``deltamode`` is not
    ``CG_DELTAMODE_PREV``, ``CG_DELTAMODE_FULL`` is used instead.
    """
    known_orders = (b'nodes', b'storage', b'linear', None)
    if nodesorder not in known_orders:
        raise error.ProgrammingError(
            b'unhandled value for nodesorder: %s' % nodesorder
        )

    if nodesorder is None and not self.delta_config.general_delta:
        nodesorder = b'storage'

    if not (
        self._storedeltachains or deltamode == repository.CG_DELTAMODE_PREV
    ):
        deltamode = repository.CG_DELTAMODE_FULL

    return storageutil.emitrevisions(
        self,
        nodes,
        nodesorder,
        revlogrevisiondelta,
        deltaparentfn=self.deltaparent,
        candeltafn=self._candelta,
        rawsizefn=self.rawsize,
        revdifffn=self.revdiff,
        flagsfn=self.flags,
        deltamode=deltamode,
        revisiondata=revisiondata,
        assumehaveparentrevisions=assumehaveparentrevisions,
        sidedata_helpers=sidedata_helpers,
        debug_info=debug_info,
    )

3290

)

3289

3291

3290

# Accepted values for the ``deltareuse`` argument of ``clone()``.
DELTAREUSEALWAYS = b'always'
DELTAREUSESAMEREVS = b'samerevs'
DELTAREUSENEVER = b'never'

DELTAREUSEFULLADD = b'fulladd'

# Every valid ``deltareuse`` value, used for argument validation.
DELTAREUSEALL = {
    DELTAREUSEALWAYS,
    DELTAREUSESAMEREVS,
    DELTAREUSENEVER,
    DELTAREUSEFULLADD,
}

3297

3299

3298

def clone(
    self,
    tr,
    destrevlog,
    addrevisioncb=None,
    deltareuse=DELTAREUSESAMEREVS,
    forcedeltabothparents=None,
    sidedata_helpers=None,
):
    """Copy this revlog to another, possibly with format changes.

    The destination revlog will contain the same revisions and nodes.
    However, it may not be bit-for-bit identical due to e.g. delta encoding
    differences.

    The ``deltareuse`` argument controls how deltas from the existing
    revlog are preserved in the destination revlog. The argument can have
    the following values:

    DELTAREUSEALWAYS
       Deltas will always be reused (if possible), even if the destination
       revlog would not select the same revisions for the delta. This is the
       fastest mode of operation.
    DELTAREUSESAMEREVS
       Deltas will be reused if the destination revlog would pick the same
       revisions for the delta. This mode strikes a balance between speed
       and optimization.
    DELTAREUSENEVER
       Deltas will never be reused. This is the slowest mode of execution.
       This mode can be used to recompute deltas (e.g. if the diff/delta
       algorithm changes).
    DELTAREUSEFULLADD
       Revisions will be re-added as if they were new content. This is
       slower than DELTAREUSEALWAYS but allows more mechanisms to kick in,
       e.g. large file detection and handling.

    Delta computation can be slow, so the choice of delta reuse policy can
    significantly affect run time.

    The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
    two extremes. Deltas will be reused if they are appropriate. But if the
    delta could choose a better revision, it will do so. This means if you
    are converting a non-generaldelta revlog to a generaldelta revlog,
    deltas will be recomputed if the delta's parent isn't a parent of the
    revision.

    In addition to the delta policy, the ``forcedeltabothparents``
    argument controls whether to force compute deltas against both parents
    for merges. When it is not set, the destination's current setting is
    used.

    See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
    `sidedata_helpers`.

    Raises ``ValueError`` for an unknown ``deltareuse`` value, a non-empty
    destination, or filtered revisions on either revlog.
    """
    if deltareuse not in self.DELTAREUSEALL:
        raise ValueError(
            _(b'value for deltareuse invalid: %s') % deltareuse
        )

    if len(destrevlog):
        raise ValueError(_(b'destination revlog is not empty'))

    if getattr(self, 'filteredrevs', None):
        raise ValueError(_(b'source revlog has filtered revisions'))
    if getattr(destrevlog, 'filteredrevs', None):
        raise ValueError(_(b'destination revlog has filtered revisions'))

    # Work on a copy of the destination's delta config so the caller's
    # settings can be put back once the copy is done.
    old_delta_config = destrevlog.delta_config
    destrevlog.delta_config = destrevlog.delta_config.copy()

    try:
        # lazy_delta and lazy_delta_base control whether to reuse a cached
        # delta, if possible.  Values are (lazy_delta_base, lazy_delta);
        # DELTAREUSEFULLADD leaves both settings untouched.
        lazy_settings = {
            self.DELTAREUSEALWAYS: (True, True),
            self.DELTAREUSESAMEREVS: (False, True),
            self.DELTAREUSENEVER: (False, False),
        }
        if deltareuse in lazy_settings:
            lazy_base, lazy = lazy_settings[deltareuse]
            destrevlog.delta_config.lazy_delta_base = lazy_base
            destrevlog.delta_config.lazy_delta = lazy

        destrevlog.delta_config.delta_both_parents = (
            forcedeltabothparents or old_delta_config.delta_both_parents
        )

        with self.reading():
            self._clone(
                tr,
                destrevlog,
                addrevisioncb,
                deltareuse,
                forcedeltabothparents,
                sidedata_helpers,
            )

    finally:
        destrevlog.delta_config = old_delta_config

3397

3399

3398

def _clone(
    self,
    tr,
    destrevlog,
    addrevisioncb,
    deltareuse,
    forcedeltabothparents,
    sidedata_helpers,
):
    """perform the core duty of `revlog.clone` after parameter processing

    Every revision of ``self`` is visited in iteration order and appended
    to ``destrevlog`` inside transaction ``tr``. After each revision,
    ``addrevisioncb(self, rev, node)`` is invoked when a callback is given.

    ``deltareuse`` picks the copy path:

    * ``self.DELTAREUSEFULLADD``: the revision data is read and handed to
      ``destrevlog.addrevision()``.
    * anything else: the revision is handed to the lower-level
      ``destrevlog._addrevision()``. When ``destrevlog._lazydelta`` is
      set and the source revision has a delta parent, the stored chunk is
      offered as ``cachedelta`` and the raw text is not read.

    When ``sidedata_helpers`` is not None the sidedata and flags are passed
    through ``sidedatautil.run_sidedata_helpers`` before being written.

    ``forcedeltabothparents`` is part of the signature but is not read in
    this method.
    """
    write_debug = None
    if self._debug_delta:
        write_debug = tr._report
    deltacomputer = deltautil.deltacomputer(
        destrevlog,
        write_debug=write_debug,
    )
    index = self.index
    for rev in self:
        entry = index[rev]

        # Some classes override linkrev to take filtered revs into
        # account. Use raw entry from index.
        flags = entry[0] & 0xFFFF
        linkrev = entry[4]
        p1 = index[entry[5]][7]
        p2 = index[entry[6]][7]
        node = entry[7]

        # (Possibly) reuse the delta from the revlog if allowed and
        # the revlog chunk is a delta.
        cachedelta = None
        rawtext = None
        if deltareuse == self.DELTAREUSEFULLADD:
            text = self._revisiondata(rev)
            sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # NOTE(review): `&` binds tighter than `|`, so flags that
                # are already set on the entry are never cleared by
                # new_flags[1]. Parenthesised to make that explicit;
                # confirm this is the intended semantics.
                flags = flags | (new_flags[0] & ~new_flags[1])

            destrevlog.addrevision(
                text,
                tr,
                linkrev,
                p1,
                p2,
                cachedelta=cachedelta,
                node=node,
                flags=flags,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )
        else:
            if destrevlog._lazydelta:
                dp = self.deltaparent(rev)
                if dp != nullrev:
                    cachedelta = (dp, bytes(self._chunk(rev)))

            sidedata = None
            if not cachedelta:
                rawtext = self._revisiondata(rev)
                sidedata = self.sidedata(rev)
            if sidedata is None:
                sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # NOTE(review): same precedence remark as in the
                # DELTAREUSEFULLADD branch above.
                flags = flags | (new_flags[0] & ~new_flags[1])

            with destrevlog._writing(tr):
                destrevlog._addrevision(
                    node,
                    rawtext,
                    tr,
                    linkrev,
                    p1,
                    p2,
                    flags,
                    cachedelta,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

        if addrevisioncb:
            addrevisioncb(self, rev, node)

3488

3490

3489

def censorrevision(self, tr, censornode, tombstone=b''):
    """Censor ``censornode``, dispatching on the revlog format version.

    Version 0 revlogs cannot be censored: ``error.RevlogError`` is raised.
    Version 1 is delegated to ``rewrite.v1_censor`` and every other
    version to ``rewrite.v2_censor``; both receive this revlog, the
    transaction ``tr``, ``censornode`` and ``tombstone`` unchanged.
    """
    if self._format_version == REVLOGV0:
        raise error.RevlogError(
            _(b'cannot censor with version %d revlogs')
            % self._format_version
        )
    elif self._format_version == REVLOGV1:
        rewrite.v1_censor(self, tr, censornode, tombstone)
    else:
        rewrite.v2_censor(self, tr, censornode, tombstone)

3499

3501

3500

def verifyintegrity(self, state):
    """Verifies the integrity of the revlog.

    Yields ``revlogproblem`` instances describing problems that are
    found.

    ``state`` is a dict shared with the caller. This method reads
    ``state[b'expectedversion']``, ``state[b'erroroncensored']`` and the
    optional ``state[b'skipflags']``. It resets ``state[b'skipread']`` and
    ``state[b'safe_renamed']`` to empty sets, then adds to
    ``state[b'skipread']`` the nodes whose content could not be read.
    """
    dd, di = self.checksize()
    if dd:
        yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
    if di:
        yield revlogproblem(error=_(b'index contains %d extra bytes') % di)

    version = self._format_version

    # The verifier tells us what version revlog we should be.
    if version != state[b'expectedversion']:
        yield revlogproblem(
            warning=_(b"warning: '%s' uses revlog format %d; expected %d")
            % (self.display_id, version, state[b'expectedversion'])
        )

    state[b'skipread'] = set()
    state[b'safe_renamed'] = set()

    for rev in self:
        node = self.node(rev)

        # Verify contents. 4 cases to care about:
        #
        #   common: the most common case
        #   rename: with a rename
        #   meta: file content starts with b'\1\n', the metadata
        #         header defined in filelog.py, but without a rename
        #   ext: content stored externally
        #
        # More formally, their differences are shown below:
        #
        #                       | common | rename | meta  | ext
        #  -------------------------------------------------------
        #   flags()             | 0      | 0      | 0     | not 0
        #   renamed()           | False  | True   | False | ?
        #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
        #
        # "rawtext" means the raw text stored in revlog data, which
        # could be retrieved by "rawdata(rev)". "text"
        # mentioned below is "revision(rev)".
        #
        # There are 3 different lengths stored physically:
        #  1. L1: rawsize, stored in revlog index
        #  2. L2: len(rawtext), stored in revlog data
        #  3. L3: len(text), stored in revlog data if flags==0, or
        #     possibly somewhere else if flags!=0
        #
        # L1 should be equal to L2. L3 could be different from them.
        # "text" may or may not affect commit hash depending on flag
        # processors (see flagutil.addflagprocessor).
        #
        #              | common  | rename | meta  | ext
        # -------------------------------------------------
        #    rawsize() | L1      | L1     | L1    | L1
        #       size() | L1      | L2-LM  | L1(*) | L1 (?)
        # len(rawtext) | L2      | L2     | L2    | L2
        #    len(text) | L2      | L2     | L2    | L3
        #  len(read()) | L2      | L2-LM  | L2-LM | L3 (?)
        #
        # LM:  length of metadata, depending on rawtext
        # (*): not ideal, see comment in filelog.size
        # (?): could be "- len(meta)" if the resolved content has
        #      rename metadata
        #
        # Checks needed to be done:
        #  1. length check: L1 == L2, in all cases.
        #  2. hash check: depending on flag processor, we may need to
        #     use either "text" (external), or "rawtext" (in revlog).

        try:
            # Keep only the skip flags that this revision actually carries.
            skipflags = state.get(b'skipflags', 0)
            if skipflags:
                skipflags &= self.flags(rev)

            _verify_revision(self, skipflags, state, node)

            l1 = self.rawsize(rev)
            l2 = len(self.rawdata(node))

            if l1 != l2:
                yield revlogproblem(
                    error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                    node=node,
                )

        except error.CensoredNodeError:
            if state[b'erroroncensored']:
                yield revlogproblem(
                    error=_(b'censored file data'), node=node
                )
                state[b'skipread'].add(node)
        except Exception as e:
            # Any other failure is reported as a problem rather than
            # aborting the whole verification run.
            yield revlogproblem(
                error=_(b'unpacking %s: %s')
                % (short(node), stringutil.forcebytestr(e)),
                node=node,
            )
            state[b'skipread'].add(node)

3604

3606

3605

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Return a dict holding the storage facts that were asked for.

    Each keyword enables one bytes key in the result:

    * ``exclusivefiles``: list of ``(opener, path)`` pairs; the index
      file, plus the data file when the revlog is not inline.
    * ``sharedfiles``: always an empty list.
    * ``revisionscount``: ``len(self)``.
    * ``trackedsize``: sum of ``self.rawsize(rev)`` over all revisions.
    * ``storedsize``: sum of the ``st_size`` of every path returned by
      ``self.files()``, as reported by ``self.opener.stat``.

    With no keyword enabled an empty dict is returned.
    """
    d = {}

    if exclusivefiles:
        d[b'exclusivefiles'] = [(self.opener, self._indexfile)]
        if not self._inline:
            d[b'exclusivefiles'].append((self.opener, self._datafile))

    if sharedfiles:
        d[b'sharedfiles'] = []

    if revisionscount:
        d[b'revisionscount'] = len(self)

    if trackedsize:
        d[b'trackedsize'] = sum(map(self.rawsize, iter(self)))

    if storedsize:
        d[b'storedsize'] = sum(
            self.opener.stat(path).st_size for path in self.files()
        )

    return d

3635

3637

3636

def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
    """Generate sidedata for revisions ``startrev``..``endrev`` (inclusive).

    Does nothing when the revlog has no sidedata support or when
    ``helpers[1]`` and ``helpers[2]`` are both empty. Otherwise, for each
    revision, sidedata is computed with
    ``sidedatautil.run_sidedata_helpers``, serialized, optionally
    compressed, and appended through the sidedata file handle. The
    matching index entries are then updated in memory and rewritten
    through the index file handle.

    Raises ``error.Abort`` if a revision in the range already has sidedata
    (non-zero entry fields 8 or 9).
    """
    if not self.hassidedata:
        return
    # revlog formats with sidedata support does not support inline
    assert not self._inline
    if not helpers[1] and not helpers[2]:
        # Nothing to generate or remove
        return

    new_entries = []
    # append the new sidedata
    with self._writing(transaction):
        ifh, dfh, sdfh = self._writinghandles
        # NOTE(review): this seeks the *data* handle while the offset
        # below is read from the *sidedata* handle; kept as-is, confirm
        # whether `sdfh` was intended.
        dfh.seek(self._docket.sidedata_end, os.SEEK_SET)

        current_offset = sdfh.tell()
        for rev in range(startrev, endrev + 1):
            entry = self.index[rev]
            new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                store=self,
                sidedata_helpers=helpers,
                sidedata={},
                rev=rev,
            )

            serialized_sidedata = sidedatautil.serialize_sidedata(
                new_sidedata
            )

            sidedata_compression_mode = COMP_MODE_INLINE
            if serialized_sidedata and self.hassidedata:
                sidedata_compression_mode = COMP_MODE_PLAIN
                h, comp_sidedata = self.compress(serialized_sidedata)
                # Slice instead of index: on Python 3 `bytes[0]` is an
                # int and would never compare equal to a bytes value,
                # which made both header checks below constant.
                # Assumes default_compression_header is a one-byte
                # bytes value - TODO confirm against the docket.
                if (
                    h != b'u'
                    and comp_sidedata[0:1] != b'\0'
                    and len(comp_sidedata) < len(serialized_sidedata)
                ):
                    assert not h
                    if (
                        comp_sidedata[0:1]
                        == self._docket.default_compression_header
                    ):
                        sidedata_compression_mode = COMP_MODE_DEFAULT
                        serialized_sidedata = comp_sidedata
                    else:
                        sidedata_compression_mode = COMP_MODE_INLINE
                        serialized_sidedata = comp_sidedata
            if entry[8] != 0 or entry[9] != 0:
                # rewriting entries that already have sidedata is not
                # supported yet, because it introduces garbage data in the
                # revlog.
                msg = b"rewriting existing sidedata is not supported yet"
                raise error.Abort(msg)

            # Apply (potential) flags to add and to remove after running
            # the sidedata helpers
            # NOTE(review): `&` binds tighter than `|`, so this never
            # clears a flag already present in entry[0]; confirm intent.
            new_offset_flags = entry[0] | (flags[0] & ~flags[1])
            entry_update = (
                current_offset,
                len(serialized_sidedata),
                new_offset_flags,
                sidedata_compression_mode,
            )

            # the sidedata computation might have moved the file cursors
            # around
            sdfh.seek(current_offset, os.SEEK_SET)
            sdfh.write(serialized_sidedata)
            new_entries.append(entry_update)
            current_offset += len(serialized_sidedata)
            self._docket.sidedata_end = sdfh.tell()

        # rewrite the new index entries
        ifh.seek(startrev * self.index.entry_size)
        for i, e in enumerate(new_entries):
            rev = startrev + i
            self.index.replace_sidedata_info(rev, *e)
            packed = self.index.entry_binary(rev)
            if rev == 0 and self._docket is None:
                # Without a docket the format header is prepended to the
                # first packed entry.
                header = self._format_flags | self._format_version
                header = self.index.pack_header(header)
                packed = header + packed
            ifh.write(packed)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # revlog.py - storage back-end for mercurial
             # coding: utf8
             #
             # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Storage back-end for Mercurial.
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches.
             """
             import binascii
             import collections
             import contextlib
             import io
             import os
             import struct
             import weakref
             import zlib
             # import stuff from node for others to import from revlog
             from .node import (
                 bin,
                 hex,
                 nullrev,
                 sha1nodeconstants,
                 short,
                 wdirrev,
             )
             from .i18n import _
             from .revlogutils.constants import (
                 ALL_KINDS,
                 CHANGELOGV2,
                 COMP_MODE_DEFAULT,
                 COMP_MODE_INLINE,
                 COMP_MODE_PLAIN,
                 DELTA_BASE_REUSE_NO,
                 DELTA_BASE_REUSE_TRY,
                 ENTRY_RANK,
                 FEATURES_BY_VERSION,
                 FLAG_GENERALDELTA,
                 FLAG_INLINE_DATA,
                 INDEX_HEADER,
                 KIND_CHANGELOG,
                 KIND_FILELOG,
                 RANK_UNKNOWN,
                 REVLOGV0,
                 REVLOGV1,
                 REVLOGV1_FLAGS,
                 REVLOGV2,
                 REVLOGV2_FLAGS,
                 REVLOG_DEFAULT_FLAGS,
                 REVLOG_DEFAULT_FORMAT,
                 REVLOG_DEFAULT_VERSION,
                 SUPPORTED_FLAGS,
             )
             from .revlogutils.flagutil import (
                 REVIDX_DEFAULT_FLAGS,
                 REVIDX_ELLIPSIS,
                 REVIDX_EXTSTORED,
                 REVIDX_FLAGS_ORDER,
                 REVIDX_HASCOPIESINFO,
                 REVIDX_ISCENSORED,
                 REVIDX_RAWTEXT_CHANGING_FLAGS,
             )
             from .thirdparty import attr
             from . import (
                 ancestor,
                 dagop,
                 error,
                 mdiff,
                 policy,
                 pycompat,
                 revlogutils,
                 templatefilters,
                 util,
             )
             from .interfaces import (
                 repository,
                 util as interfaceutil,
             )
             from .revlogutils import (
                 deltas as deltautil,
                 docket as docketutil,
                 flagutil,
                 nodemap as nodemaputil,
                 randomaccessfile,
                 revlogv0,
                 rewrite,
                 sidedata as sidedatautil,
             )
             from .utils import (
                 storageutil,
                 stringutil,
             )
             # Bare references to every re-exported name, so that pyflakes does not
             # report the imports above as unused.
             # We need these names available in the module for extensions.
             REVLOGV0
             REVLOGV1
             REVLOGV2
             CHANGELOGV2
             FLAG_INLINE_DATA
             FLAG_GENERALDELTA
             REVLOG_DEFAULT_FLAGS
             REVLOG_DEFAULT_FORMAT
             REVLOG_DEFAULT_VERSION
             REVLOGV1_FLAGS
             REVLOGV2_FLAGS
             REVIDX_ISCENSORED
             REVIDX_ELLIPSIS
             REVIDX_HASCOPIESINFO
             REVIDX_EXTSTORED
             REVIDX_DEFAULT_FLAGS
             REVIDX_FLAGS_ORDER
             REVIDX_RAWTEXT_CHANGING_FLAGS
             # Implementation modules are resolved through `policy`.
             # NOTE(review): `rustrevlog` is compared against None further down, so
             # importrust() presumably yields None when the Rust module is missing.
             parsers = policy.importmod('parsers')
             rustancestor = policy.importrust('ancestor')
             rustdagop = policy.importrust('dagop')
             rustrevlog = policy.importrust('revlog')
             # Aliased for performance.
             _zlibdecompress = zlib.decompress
             # max size of inline data embedded into a revlog (131072 == 128 * 1024)
             _maxinline = 131072
             # Flag processors for REVIDX_ELLIPSIS.
             #
             # All three are pass-through: the text is never transformed.
             # NOTE(review): the boolean is presumably the "validate hash" answer
             # expected by the flag processor machinery - confirm in flagutil.
             def ellipsisreadprocessor(rl, text):
                 """Read-side processor: hand back ``text`` untouched, plus False."""
                 return (text, False)
             def ellipsiswriteprocessor(rl, text):
                 """Write-side processor: hand back ``text`` untouched, plus False."""
                 return (text, False)
             def ellipsisrawprocessor(rl, text):
                 """Raw-side processor: always answer False."""
                 return False
             # (read, write, raw) triple registered for the ellipsis flag.
             ellipsisprocessor = (
                 ellipsisreadprocessor,
                 ellipsiswriteprocessor,
                 ellipsisrawprocessor,
             )
             def _verify_revision(rl, skipflags, state, node):
                 """Verify the integrity of the given revlog ``node`` while providing a hook
                 point for extensions to influence the operation."""
                 if skipflags:
                     state[b'skipread'].add(node)
                 else:
                     # Side-effect: read content and verify hash.
                     rl.revision(node)
             # True if a fast implementation of the persistent nodemap is available.
             #
             # The "pure" Python implementation is also counted as "fast": people
             # running pure do not really have performance expectations (and have a
             # wheelbarrow of other sources of slowness).
             # NOTE(review): `BaseIndexObject` on `parsers` is presumably what
             # identifies the pure implementation - confirm.
             HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
                 parsers, 'BaseIndexObject'
             )
             @interfaceutil.implementer(repository.irevisiondelta)
             @attr.s(slots=True)
             class revlogrevisiondelta:
                 """Slotted attrs record declared as implementing
                 ``repository.irevisiondelta``.

                 Every field is required except ``linknode``, which defaults to None.
                 """
                 node = attr.ib()
                 p1node = attr.ib()
                 p2node = attr.ib()
                 basenode = attr.ib()
                 flags = attr.ib()
                 baserevisionsize = attr.ib()
                 revision = attr.ib()
                 delta = attr.ib()
                 sidedata = attr.ib()
                 protocol_flags = attr.ib()
                 linknode = attr.ib(default=None)
             @interfaceutil.implementer(repository.iverifyproblem)
             @attr.s(frozen=True)
             class revlogproblem:
                 """Frozen attrs record declared as implementing
                 ``repository.iverifyproblem``.

                 All fields are optional and default to None.
                 """
                 # message for a non-fatal finding
                 warning = attr.ib(default=None)
                 # message for a fatal finding
                 error = attr.ib(default=None)
                 # node the finding is about, when it concerns a single revision
                 node = attr.ib(default=None)
             def parse_index_v1(data, inline):
                 """Parse revlog index ``data`` and return an ``(index, cache)`` pair.

                 The work is delegated to ``parsers.parse_index2`` with its default
                 format.
                 """
                 parsed_index, parsed_cache = parsers.parse_index2(data, inline)
                 return parsed_index, parsed_cache
             def parse_index_v2(data, inline):
                 """Parse revlog index ``data`` and return an ``(index, cache)`` pair.

                 The work is delegated to ``parsers.parse_index2`` with
                 ``format=REVLOGV2``.
                 """
                 parsed_index, parsed_cache = parsers.parse_index2(
                     data, inline, format=REVLOGV2
                 )
                 return parsed_index, parsed_cache
             def parse_index_cl_v2(data, inline):
                 """Parse revlog index ``data`` and return an ``(index, cache)`` pair.

                 The work is delegated to ``parsers.parse_index2`` with
                 ``format=CHANGELOGV2``.
                 """
                 parsed_index, parsed_cache = parsers.parse_index2(
                     data, inline, format=CHANGELOGV2
                 )
                 return parsed_index, parsed_cache
             # Stays None unless `parsers` provides the devel nodemap parser.
             parse_index_v1_nodemap = None
             if hasattr(parsers, 'parse_index_devel_nodemap'):
                 def parse_index_v1_nodemap(data, inline):
                     """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``
                     and return an ``(index, cache)`` pair."""
                     parsed_index, parsed_cache = parsers.parse_index_devel_nodemap(
                         data, inline
                     )
                     return parsed_index, parsed_cache
             def parse_index_v1_mixed(data, inline):
                 """Parse index ``data`` as v1, then wrap the index in
                 ``rustrevlog.MixedIndex``; the cache is returned untouched."""
                 v1_index, cache = parse_index_v1(data, inline)
                 mixed_index = rustrevlog.MixedIndex(v1_index)
                 return mixed_index, cache
             # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
             # signed integer); 0x7FFFFFFF == 2**31 - 1
             _maxentrysize = 0x7FFFFFFF
             # Translated message template; the placeholders are, in order: a name
             # for the revlog (%s), the expected byte count, the offset and the
             # actual data size (%d each).
             FILE_TOO_SHORT_MSG = _(
                 b'cannot read from revlog %s;'
                 b'  expected %d bytes from offset %d, data size is %d'
             )
             # every ASCII hexadecimal digit, lower and upper case, as bytes
             hexdigits = b'0123456789abcdefABCDEF'
             class _Config:
                 def copy(self):
                     return self.__class__(**self.__dict__)
             @attr.s()
             class FeatureConfig(_Config):
                 """Hold configuration values about the available revlog features"""
                 # the default compression engine
                 compression_engine = attr.ib(default=b'zlib')
                 # options for the compression engines (a fresh dict per instance)
                 compression_engine_options = attr.ib(default=attr.Factory(dict))
                 # can we use censor on this revlog
                 censorable = attr.ib(default=False)
                 # does this revlog use the "side data" feature
                 has_side_data = attr.ib(default=False)
                 # might remove rank configuration once the computation has no impact
                 compute_rank = attr.ib(default=False)
                 # parent order is supposed to be semantically irrelevant, so we
                 # normally resort parents to ensure that the first parent is non-null,
                 # if there is a non-null parent at all.
                 # filelog abuses the parent order as flag to mark some instances of
                 # meta-encoded files, so allow it to disable this behavior.
                 canonical_parent_order = attr.ib(default=False)
                 # can ellipsis commit be used
                 enable_ellipsis = attr.ib(default=False)
                 def copy(self):
                     """Copy this config, giving the copy its own options dict.

                     The base ``copy()`` shares attribute values, so the
                     ``compression_engine_options`` dict is duplicated here to keep
                     later changes on one object from showing up on the other.
                     """
                     new = super().copy()
                     new.compression_engine_options = self.compression_engine_options.copy()
                     return new
             @attr.s()
             class DataConfig(_Config):
                 """Hold configuration values about how the revlog data is read"""
                 # should we try to open the "pending" version of the revlog
                 try_pending = attr.ib(default=False)
                 # should we try to open the "split" version of the revlog
                 try_split = attr.ib(default=False)
                 # When True, indexfile should be opened with checkambig=True at writing,
                 # to avoid file stat ambiguity.
                 check_ambig = attr.ib(default=False)
                 # If true, use mmap instead of reading to deal with large index
                 mmap_large_index = attr.ib(default=False)
                 # size from which an index counts as "large" for mmap_large_index
                 mmap_index_threshold = attr.ib(default=None)
                 # How much data to read and cache into the raw revlog data cache.
                 chunk_cache_size = attr.ib(default=65536)
                 # Allow sparse reading of the revlog data
                 with_sparse_read = attr.ib(default=False)
                 # minimal density of a sparse read chunk
                 sr_density_threshold = attr.ib(default=0.50)
                 # minimal size of data we skip when performing sparse read
                 sr_min_gap_size = attr.ib(default=262144)
                 # are deltas encoded against arbitrary bases?
                 generaldelta = attr.ib(default=False)
             @attr.s()
             class DeltaConfig(_Config):
                 """Hold configuration values about how new deltas are computed
                 Some attributes are duplicated from DataConfig to help having each
                 object self contained.
                 """
                 # can deltas be encoded against arbitrary bases.
                 general_delta = attr.ib(default=False)
                 # Allow sparse writing of the revlog data
                 sparse_revlog = attr.ib(default=False)
                 # maximum length of a delta chain
                 max_chain_len = attr.ib(default=None)
                 # Maximum distance between delta chain base start and end
                 max_deltachain_span = attr.ib(default=-1)
                 # If `upper_bound_comp` is not None, this is the expected maximal gain from
                 # compression for the data content.
                 upper_bound_comp = attr.ib(default=None)
                 # Should we try a delta against both parents
                 delta_both_parents = attr.ib(default=True)
                 # Test delta base candidate groups by chunks of this maximal size.
                 candidate_group_chunk_size = attr.ib(default=0)
                 # Should we display debug information about delta computation
                 debug_delta = attr.ib(default=False)
                 # trust incoming deltas by default
                 lazy_delta = attr.ib(default=True)
                 # trust the base of incoming deltas by default
                 lazy_delta_base = attr.ib(default=False)
             class revlog:
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, including its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 If checkambig, indexfile is opened with checkambig=True at
                 writing, to avoid file stat ambiguity.
                 If mmaplargeindex is True, and an mmapindexthreshold is set, the
                 index will be mmapped rather than read if it is larger than the
                 configured threshold.
                 If censorable is True, the revlog can have censored revisions.
                 If `upperboundcomp` is not None, this is the expected maximal gain from
                 compression for the data content.
                 `concurrencychecker` is an optional function that receives 3 arguments: a
                 file handle, a filename, and an expected position. It should check whether
                 the current position in the file handle is valid, and log/warn/fail (by
                 raising).
                 See mercurial/revlogutils/constants.py for details about the content of an
                 index entry.
                 """
                 _flagserrorclass = error.RevlogError
                 @staticmethod
                 def is_inline_index(header_bytes):
                     """Tell whether the index starting with `header_bytes` is inline.
                     The header is unpacked with `INDEX_HEADER`; its low 16 bits select the
                     format version and the remaining bits are handed to that version's
                     `inline` feature check.
                     """
                     raw_header = INDEX_HEADER.unpack(header_bytes)[0]
                     flags = raw_header & ~0xFFFF
                     version = raw_header & 0xFFFF
                     inline_check = FEATURES_BY_VERSION[version][b'inline']
                     return inline_check(flags)
                 def __init__(
                     self,
                     opener,
                     target,
                     radix,
                     postfix=None,  # only exist for `tmpcensored` now
                     checkambig=False,
                     mmaplargeindex=False,
                     censorable=False,
                     upperboundcomp=None,
                     persistentnodemap=False,
                     concurrencychecker=None,
                     trypending=False,
                     try_split=False,
                     canonical_parent_order=True,
                 ):
                     """
                     Create a revlog object and load its index.
                     `opener` is a function that abstracts the file opening operation
                     and can be used to implement COW semantics or the like.
                     `target` is a (KIND, ID) tuple that identifies the content stored in
                     this revlog. It helps the rest of the code to understand what the
                     revlog is about without having to resort to heuristics and index
                     filename analysis. Note that this must reliably be set by normal code,
                     but that test, debug, or performance measurement code might not set
                     this to an accurate value.
                     The feature, data and delta configurations are copied from the opener
                     options when present there, and created with defaults otherwise.
                     """
                     self.upperboundcomp = upperboundcomp
                     self.radix = radix
                     # File names, filled in while loading the index.
                     self._docket_file = self._indexfile = self._datafile = None
                     self._sidedatafile = self._nodemap_file = None
                     self.postfix = postfix
                     self._trypending = trypending
                     self._try_split = try_split
                     self.opener = opener
                     if persistentnodemap:
                         self._nodemap_file = nodemaputil.get_nodemap_file(self)
                     assert target[0] in ALL_KINDS
                     assert len(target) == 2
                     self.target = target
                     options = self.opener.options
                     # Each revlog works on its own copy of the shared configuration
                     # objects, then applies the per-instance arguments on top.
                     self.feature_config = (
                         options[b'feature-config'].copy()
                         if b'feature-config' in options
                         else FeatureConfig()
                     )
                     self.feature_config.censorable = censorable
                     self.feature_config.canonical_parent_order = canonical_parent_order
                     self.data_config = (
                         options[b'data-config'].copy()
                         if b'data-config' in options
                         else DataConfig()
                     )
                     self.data_config.check_ambig = checkambig
                     self.data_config.mmap_large_index = mmaplargeindex
                     self.delta_config = (
                         options[b'delta-config'].copy()
                         if b'delta-config' in options
                         else DeltaConfig()
                     )
                     # 3-tuple of (node, rev, text) for a raw revision.
                     self._revisioncache = None
                     # Maps rev to chain base rev.
                     self._chainbasecache = util.lrucachedict(100)
                     # 2-tuple of (offset, data) of raw data from the revlog at an offset.
                     self._chunkcache = (0, b'')
                     self.index = self._docket = self._nodemap_docket = None
                     # Mapping of partial identifiers to full nodes.
                     self._pcache = {}
                     # Each instance gets its own copy of the flag processors so that
                     # custom flags can be supported per revlog.
                     self._flagprocessors = dict(flagutil.flagprocessors)
                     # 3-tuple of file handles being used for active writing.
                     self._writinghandles = None
                     # prevent nesting of addgroup
                     self._adding_group = None
                     self._loadindex()
                     self._concurrencychecker = concurrencychecker
                 @property
                 def _generaldelta(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.general_delta
                 @property
                 def _checkambig(self):
                     """temporary compatibility proxy"""
                     return self.data_config.check_ambig
                 @property
                 def _mmaplargeindex(self):
                     """temporary compatibility proxy"""
                     return self.data_config.mmap_large_index
                 @property
                 def _censorable(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.censorable
                 @property
                 def _chunkcachesize(self):
                     """temporary compatibility proxy"""
                     return self.data_config.chunk_cache_size
                 @property
                 def _maxchainlen(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.max_chain_len
                 @property
                 def _deltabothparents(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.delta_both_parents
                 @property
                 def _candidate_group_chunk_size(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.candidate_group_chunk_size
                 @property
                 def _debug_delta(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.debug_delta
                 @property
                 def _compengine(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.compression_engine
                 @property
                 def _compengineopts(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.compression_engine_options
                 @property
                 def _maxdeltachainspan(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.max_deltachain_span
                 @property
                 def _withsparseread(self):
                     """temporary compatibility proxy"""
                     return self.data_config.with_sparse_read
                 @property
                 def _sparserevlog(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.sparse_revlog
                 @property
                 def hassidedata(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.has_side_data
                 @property
                 def _srdensitythreshold(self):
                     """temporary compatibility proxy"""
                     return self.data_config.sr_density_threshold
                 @property
                 def _srmingapsize(self):
                     """temporary compatibility proxy"""
                     return self.data_config.sr_min_gap_size
                 @property
                 def _compute_rank(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.compute_rank
                 @property
                 def canonical_parent_order(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.canonical_parent_order
                 @property
                 def _lazydelta(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.lazy_delta
                 @property
                 def _lazydeltabase(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.lazy_delta_base
                 def _init_opts(self):
                     """Derive the default revlog settings from the opener options.
                     These values might be affected when actually reading on disk
                     information. They are returned for use in `_loadindex()` as a
                     `(new_header, mmapindexthreshold, force_nodemap)` tuple:
                     * new_header:
                         version header to use if we need to create a new revlog
                     * mmapindexthreshold:
                         minimal index size for start to use mmap (None unless
                         `data_config.mmap_large_index` is set)
                     * force_nodemap:
                         force the usage of a "development" version of the nodemap code
                     As a side effect, the configured flag processors are registered on
                     this instance. `error.RevlogError` is raised when the chunk cache size
                     is not a strictly positive power of 2.
                     """
                     options = self.opener.options
                     if b'changelogv2' in options and self.revlog_kind == KIND_CHANGELOG:
                         self.feature_config.compute_rank = options.get(
                             b'changelogv2.compute-rank', True
                         )
                         header = CHANGELOGV2
                     elif b'revlogv2' in options:
                         header = REVLOGV2
                     elif b'revlogv1' in options:
                         header = REVLOGV1 | FLAG_INLINE_DATA
                         if b'generaldelta' in options:
                             header |= FLAG_GENERALDELTA
                     elif b'revlogv0' in options:
                         header = REVLOGV0
                     else:
                         header = REVLOG_DEFAULT_VERSION
                     data_config = self.data_config
                     threshold = (
                         data_config.mmap_index_threshold
                         if data_config.mmap_large_index
                         else None
                     )
                     if self.feature_config.enable_ellipsis:
                         self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor
                     # revlog v0 doesn't have flag processors
                     extra_processors = options.get(b'flagprocessors', {})
                     for flag, processor in extra_processors.items():
                         flagutil.insertflagprocessor(flag, processor, self._flagprocessors)
                     cache_size = data_config.chunk_cache_size
                     if cache_size <= 0:
                         msg = _(b'revlog chunk cache size %r is not greater than 0')
                         raise error.RevlogError(msg % cache_size)
                     # a power of 2 has a single bit set, so `x & (x - 1)` is zero
                     if cache_size & (cache_size - 1):
                         msg = _(b'revlog chunk cache size %r is not a power of 2')
                         raise error.RevlogError(msg % cache_size)
                     force_nodemap = options.get(b'devel-force-nodemap', False)
                     return header, threshold, force_nodemap
                 def _get_data(self, filepath, mmap_threshold, size=None):
                     """return a file content with or without mmap
                     If the file is missing return the empty string"""
                     try:
                         with self.opener(filepath) as fp:
                             if mmap_threshold is not None:
                                 file_size = self.opener.fstat(fp).st_size
                                 if file_size >= mmap_threshold:
                                     if size is not None:
                                         # avoid potentiel mmap crash
                                         size = min(file_size, size)
                                     # TODO: should .close() to release resources without
                                     # relying on Python GC
                                     if size is None:
                                         return util.buffer(util.mmapread(fp))
                                     else:
                                         return util.buffer(util.mmapread(fp, size))
                             if size is None:
                                 return fp.read()
                             else:
                                 return fp.read(size)
                     except FileNotFoundError:
                         return b''
                 def get_streams(self, max_linkrev, force_inline=False):
                     """return a list of streams that represent this revlog
                     This is used by stream-clone to do bytes to bytes copies of a repository.
                     Trailing revisions whose linkrev is not below `max_linkrev` are left
                     out of the streams.
                     If `force_inline` is set, it enforces that the stream will represent an
                     inline revlog.
                     It returns a list of three-tuples:
                         [
                             (filename, bytes_stream, stream_size),
                             …
                         ]
                     Every returned stream has already been advanced once, so the
                     underlying file is opened (or the `reading()` context entered) before
                     this method returns. The list is empty when there is nothing to send.
                     """
                     n = len(self)
                     index = self.index
                     # note: this loop will rarely go through multiple iterations, since
                     # it only traverses commits created during the current streaming
                     # pull operation.
                     #
                     # If this become a problem, using a binary search should cap the
                     # runtime of this.
                     while n > 0 and index[n - 1][4] >= max_linkrev:
                         n -= 1
                     if n == 0:
                         # no data to send
                         return []
                     index_size = n * index.entry_size
                     data_size = self.end(n - 1)
                     total_size = index_size + data_size
                     def primed_file_stream(open_fp, size):
                         # Stream the first `size` bytes of the file returned by
                         # `open_fp()`. The generator is advanced up to its initial
                         # `yield None` so that the file is opened right away.
                         def chunks():
                             with open_fp() as fp:
                                 yield None
                                 if size <= 65536:
                                     yield fp.read(size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=size)
                         stream = chunks()
                         next(stream)
                         return stream
                     # XXX we might have been split (or stripped) since the object
                     # initialization, We need to close this race too, but having a way to
                     # pre-open the file we feed to the revlog and never closing them before
                     # we are done streaming.
                     if self._inline:
                         inline_stream = primed_file_stream(self._indexfp, total_size)
                         return [
                             (self._indexfile, inline_stream, total_size),
                         ]
                     if force_inline:
                         def interleaved():
                             # Emit each index entry followed by its data segment, the
                             # way an inline revlog lays them out.
                             with self.reading():
                                 yield None
                                 for rev in range(n):
                                     entry = self.index.entry_binary(rev)
                                     if rev == 0 and self._docket is None:
                                         # re-inject the inline flag
                                         header = (
                                             self._format_flags
                                             | self._format_version
                                             | FLAG_INLINE_DATA
                                         )
                                         entry = self.index.pack_header(header) + entry
                                     yield entry
                                     yield self._getsegmentforrevs(rev, rev)[1]
                         inline_stream = interleaved()
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, total_size),
                         ]
                     # The index file is opened before the data file.
                     index_stream = primed_file_stream(self._indexfp, index_size)
                     data_stream = primed_file_stream(self._datafp, data_size)
                     return [
                         (self._datafile, data_stream, data_size),
                         (self._indexfile, index_stream, index_size),
                     ]
                 def _loadindex(self, docket=None):
                     """Read the revlog entry point and (re)build the in-memory index.
                     When `docket` is provided it is used as-is and the header of the entry
                     point is not parsed. Otherwise the first four bytes of the entry point
                     (or the default header from `_init_opts()` when the file is empty or
                     missing) give the format version and flags.
                     This sets the file name attributes, the format attributes, `index`,
                     the segment file readers and resets the chain info and decompressor
                     caches.
                     Raises `error.RevlogError` on an unknown version or unknown flags, when
                     a docket announces more index data than could be read, and when
                     parsing the index (or applying the persisted nodemap) raises
                     `ValueError` or `IndexError`.
                     """
                     new_header, mmapindexthreshold, force_nodemap = self._init_opts()
                     # Select the entry point: an explicit postfix wins, then an existing
                     # pending (`.i.a`) file, then an existing split index file, and
                     # finally the regular `.i` file.
                     if self.postfix is not None:
                         entry_point = b'%s.i.%s' % (self.radix, self.postfix)
                     elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
                         entry_point = b'%s.i.a' % self.radix
                     elif self._try_split and self.opener.exists(self._split_index_file):
                         entry_point = self._split_index_file
                     else:
                         entry_point = b'%s.i' % self.radix
                     if docket is not None:
                         # The caller already holds a docket: no header is parsed here.
                         self._docket = docket
                         self._docket_file = entry_point
                     else:
                         self._initempty = True
                         entry_data = self._get_data(entry_point, mmapindexthreshold)
                         if len(entry_data) > 0:
                             header = INDEX_HEADER.unpack(entry_data[:4])[0]
                             self._initempty = False
                         else:
                             header = new_header
                         # low 16 bits: format version, remaining bits: format flags
                         self._format_flags = header & ~0xFFFF
                         self._format_version = header & 0xFFFF
                         supported_flags = SUPPORTED_FLAGS.get(self._format_version)
                         if supported_flags is None:
                             msg = _(b'unknown version (%d) in revlog %s')
                             msg %= (self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         elif self._format_flags & ~supported_flags:
                             msg = _(b'unknown flags (%#04x) in version %d revlog %s')
                             # shift the version bits away before displaying the flags
                             display_flag = self._format_flags >> 16
                             msg %= (display_flag, self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         features = FEATURES_BY_VERSION[self._format_version]
                         self._inline = features[b'inline'](self._format_flags)
                         self.delta_config.general_delta = features[b'generaldelta'](
                             self._format_flags
                         )
                         self.feature_config.has_side_data = features[b'sidedata']
                         if not features[b'docket']:
                             # no docket for this format: the entry point is the index
                             self._indexfile = entry_point
                             index_data = entry_data
                         else:
                             # the entry point is a docket; build a default one for an
                             # empty revlog, parse the existing one otherwise
                             self._docket_file = entry_point
                             if self._initempty:
                                 self._docket = docketutil.default_docket(self, header)
                             else:
                                 self._docket = docketutil.parse_docket(
                                     self, entry_data, use_pending=self._trypending
                                 )
                     if self._docket is not None:
                         # The docket names the index file and how many of its bytes
                         # are to be read.
                         self._indexfile = self._docket.index_filepath()
                         index_data = b''
                         index_size = self._docket.index_end
                         if index_size > 0:
                             index_data = self._get_data(
                                 self._indexfile, mmapindexthreshold, size=index_size
                             )
                             if len(index_data) < index_size:
                                 msg = _(b'too few index data for %s: got %d, expected %d')
                                 msg %= (self.display_id, len(index_data), index_size)
                                 raise error.RevlogError(msg)
                         self._inline = False
                         # generaldelta implied by version 2 revlogs.
                         self.delta_config.general_delta = True
                         # the logic for persistent nodemap will be dealt with within the
                         # main docket, so disable it for now.
                         self._nodemap_file = None
                     # Data (and sidedata) file names come from the docket when there is
                     # one, and from the radix (plus optional postfix) otherwise.
                     if self._docket is not None:
                         self._datafile = self._docket.data_filepath()
                         self._sidedatafile = self._docket.sidedata_filepath()
                     elif self.postfix is None:
                         self._datafile = b'%s.d' % self.radix
                     else:
                         self._datafile = b'%s.d.%s' % (self.radix, self.postfix)
                     self.nodeconstants = sha1nodeconstants
                     self.nullid = self.nodeconstants.nullid
                     # sparse-revlog can't be on without general-delta (issue6056)
                     if not self.delta_config.general_delta:
                         self.delta_config.sparse_revlog = False
                     self._storedeltachains = True
                     # The "development" nodemap parser needs a nodemap file, the
                     # `devel-force-nodemap` option and an available parser.
                     devel_nodemap = (
                         self._nodemap_file
                         and force_nodemap
                         and parse_index_v1_nodemap is not None
                     )
                     # With the rust extension available, the rust index is used whenever
                     # a nodemap file is set, and on request (`rust.index`) otherwise.
                     use_rust_index = False
                     if rustrevlog is not None:
                         if self._nodemap_file is not None:
                             use_rust_index = True
                         else:
                             use_rust_index = self.opener.options.get(b'rust.index')
                     # Default to the v1 parser; the format version takes precedence
                     # over the nodemap and rust variants when picking another one.
                     self._parse_index = parse_index_v1
                     if self._format_version == REVLOGV0:
                         self._parse_index = revlogv0.parse_index_v0
                     elif self._format_version == REVLOGV2:
                         self._parse_index = parse_index_v2
                     elif self._format_version == CHANGELOGV2:
                         self._parse_index = parse_index_cl_v2
                     elif devel_nodemap:
                         self._parse_index = parse_index_v1_nodemap
                     elif use_rust_index:
                         self._parse_index = parse_index_v1_mixed
                     try:
                         d = self._parse_index(index_data, self._inline)
                         index, chunkcache = d
                         # The persisted nodemap is only considered for non-inline
                         # revlogs whose index object can consume it.
                         use_nodemap = (
                             not self._inline
                             and self._nodemap_file is not None
                             and hasattr(index, 'update_nodemap_data')
                         )
                         if use_nodemap:
                             nodemap_data = nodemaputil.persisted_data(self)
                             if nodemap_data is not None:
                                 docket = nodemap_data[0]
                                 # Only trust the persisted data when the tip recorded in
                                 # its docket still matches the index (field 7 of the
                                 # entry is presumably the node -- see the index entry
                                 # layout to confirm).
                                 if (
                                     len(d[0]) > docket.tip_rev
                                     and d[0][docket.tip_rev][7] == docket.tip_node
                                 ):
                                     # no changelog tampering
                                     self._nodemap_docket = docket
                                     index.update_nodemap_data(*nodemap_data)
                     except (ValueError, IndexError):
                         raise error.RevlogError(
                             _(b"index %s is corrupted") % self.display_id
                         )
                     self.index = index
                     # Revision data is read from the index file for inline revlogs and
                     # from the data file otherwise; `chunkcache` comes from the parser.
                     self._segmentfile = randomaccessfile.randomaccessfile(
                         self.opener,
                         (self._indexfile if self._inline else self._datafile),
                         self._chunkcachesize,
                         chunkcache,
                     )
                     self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
                         self.opener,
                         self._sidedatafile,
                         self._chunkcachesize,
                     )
                     # revnum -> (chain-length, sum-delta-length)
                     self._chaininfocache = util.lrucachedict(500)
                     # revlog header -> revlog compressor
                     self._decompressors = {}
                 def get_revlog(self):
                     """Return this object itself.
                     Simple function to mirror the API of other not-really-revlog objects.
                     """
                     return self
                 @util.propertycache
                 def revlog_kind(self):
                     """The first item (KIND) of the `target` tuple."""
                     target = self.target
                     return target[0]
                 @util.propertycache
                 def display_id(self):
                     """The public facing "ID" of the revlog that we use in messages"""
                     if self.revlog_kind != KIND_FILELOG:
                         return self.radix
                     # Reference the file without the "data/" prefix, so it is familiar
                     # to the user.
                     return self.target[1]
                 def _get_decompressor(self, t):
                     try:
                         compressor = self._decompressors[t]
                     except KeyError:
                         try:
                             engine = util.compengines.forrevlogheader(t)
                             compressor = engine.revlogcompressor(self._compengineopts)
                             self._decompressors[t] = compressor
                         except KeyError:
                             raise error.RevlogError(
                                 _(b'unknown compression type %s') % binascii.hexlify(t)
                             )
                     return compressor
                 @util.propertycache
                 def _compressor(self):
                     """Revlog compressor built from the configured engine and options."""
                     return util.compengines[self._compengine].revlogcompressor(
                         self._compengineopts
                     )
                 @util.propertycache
                 def _decompressor(self):
                     """the default decompressor

                     ``None`` when the revlog has no docket; otherwise the
                     ``decompress`` callable for the docket's default compression
                     header.
                     """
                     docket = self._docket
                     if docket is None:
                         return None
                     header = docket.default_compression_header
                     return self._get_decompressor(header).decompress
                 def _indexfp(self):
                     """file object for the revlog's index file"""
                     return self.opener(self._indexfile, mode=b"r")
                 def __index_write_fp(self):
                     """Open the index file for writing, positioned for appending.

                     Without a docket the position is the end of the file; with one it
                     is ``self._docket.index_end``.  A missing file is created.
                     """
                     # You should not use this directly and use `_writing` instead
                     try:
                         fp = self.opener(
                             self._indexfile,
                             mode=b"r+",
                             checkambig=self.data_config.check_ambig,
                         )
                         docket = self._docket
                         if docket is not None:
                             fp.seek(docket.index_end, os.SEEK_SET)
                         else:
                             fp.seek(0, os.SEEK_END)
                         return fp
                     except FileNotFoundError:
                         # Nothing on disk yet: start a brand new file.
                         return self.opener(
                             self._indexfile,
                             mode=b"w+",
                             checkambig=self.data_config.check_ambig,
                         )
                 def __index_new_fp(self):
                     """Open a fresh index file (mode ``w``) through an atomic temp file."""
                     # You should not use this unless you are upgrading from inline revlog
                     open_ = self.opener
                     path = self._indexfile
                     check_ambig = self.data_config.check_ambig
                     return open_(path, mode=b"w", checkambig=check_ambig, atomictemp=True)
                 def _datafp(self, mode=b'r'):
                     """file object for the revlog's data file"""
                     return self.opener(self._datafile, mode=mode)
                 @contextlib.contextmanager
                 def _sidedatareadfp(self):
                     """file object suitable to read sidedata"""
                     if self._writinghandles:
                         yield self._writinghandles[2]
                     else:
                         with self.opener(self._sidedatafile) as fp:
                             yield fp
                 def tiprev(self):
                     """Return the highest revision number (-1 when the index is empty)."""
                     count = len(self.index)
                     return count - 1
                 def tip(self):
                     """Return the node of the tip revision (see ``tiprev``)."""
                     last = self.tiprev()
                     return self.node(last)
                 def __contains__(self, rev):
                     return 0 <= rev < len(self)
                 def __len__(self):
                     return len(self.index)
                 def __iter__(self):
                     return iter(range(len(self)))
                 def revs(self, start=0, stop=None):
                     """iterate over all rev in this revlog (from start to stop)

                     The iteration itself is delegated to ``storageutil.iterrevs``.
                     """
                     total = len(self)
                     return storageutil.iterrevs(total, start=start, stop=stop)
                 def hasnode(self, node):
                     """Tell whether ``node`` is known to this revlog.

                     True when ``self.rev(node)`` succeeds, False when it raises
                     ``KeyError``.
                     """
                     try:
                         self.rev(node)
                     except KeyError:
                         return False
                     return True
                 def _candelta(self, baserev, rev):
                     """whether two revisions (baserev, rev) can be delta-ed or not"""
                     # A content-changing flag processor (ex. LFS) can alter the rawtext
                     # a delta would be based on.  Two clients may hold the same revlog
                     # node with different flags (i.e. different rawtext contents), which
                     # would make the delta incompatible, so refuse as soon as either
                     # revision carries such a flag.
                     blocking = REVIDX_RAWTEXT_CHANGING_FLAGS
                     if self.flags(baserev) & blocking:
                         return False
                     if self.flags(rev) & blocking:
                         return False
                     return True
                 def update_caches(self, transaction):
                     """update on disk cache

                     If a transaction is passed, the update may be delayed to transaction
                     commit.  Nothing is done when the revlog has no nodemap file."""
                     if self._nodemap_file is None:
                         return
                     if transaction is not None:
                         nodemaputil.setup_persistent_nodemap(transaction, self)
                     else:
                         nodemaputil.update_persistent_nodemap(self)
                 def clearcaches(self):
                     """Clear in-memory caches"""
                     self._revisioncache = None
                     self._chainbasecache.clear()
                     self._segmentfile.clear_cache()
                     self._segmentfile_sidedata.clear_cache()
                     self._pcache = {}
                     self._nodemap_docket = None
                     self.index.clearcaches()
                     # The python code is the one responsible for validating the docket, we
                     # end up having to refresh it here -- but only for a non-inline revlog
                     # with a nodemap file whose index can take nodemap data.
                     if (
                         self._inline
                         or self._nodemap_file is None
                         or not hasattr(self.index, 'update_nodemap_data')
                     ):
                         return
                     persisted = nodemaputil.persisted_data(self)
                     if persisted is None:
                         return
                     self._nodemap_docket = persisted[0]
                     self.index.update_nodemap_data(*persisted)
                 def rev(self, node):
                     """return the revision number associated with a <nodeid>

                     Raises ``error.WdirUnsupported`` for the working-directory
                     pseudo-nodes and ``error.LookupError`` for any other node the
                     index lookup rejects with ``error.RevlogError``.
                     """
                     try:
                         return self.index.rev(node)
                     except TypeError:
                         raise
                     except error.RevlogError:
                         # parsers.c radix tree lookup failed
                         consts = self.nodeconstants
                         if node == consts.wdirid or node in consts.wdirfilenodeids:
                             raise error.WdirUnsupported
                         raise error.LookupError(node, self.display_id, _(b'no node'))
                 # Accessors for index entries.
                 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
                 # are flags.
                 def start(self, rev):
                     """Return the offset of ``rev``: the first index field without its low 16 bits."""
                     packed = self.index[rev][0]
                     return int(packed >> 16)
                 def sidedata_cut_off(self, rev):
                     """Return the sidedata offset recorded for ``rev``, or a fallback.

                     When the entry's own offset (field 8) is zero, the result is the
                     end (offset + length, fields 8 and 9) of the closest revision at or
                     before ``rev`` that has a non-zero sidedata length, or 0 if there
                     is none.
                     """
                     index = self.index
                     own_offset = index[rev][8]
                     if own_offset != 0:
                         return own_offset
                     # This is some annoying dance, because entries without sidedata
                     # currently use 0 as their offset. (instead of previous-offset +
                     # previous-size)
                     #
                     # We should reconsider this sidedata → 0 sidedata_offset policy.
                     # In the meantime, we need this.
                     for earlier in range(rev, -1, -1):
                         entry = index[earlier]
                         if entry[9] != 0:
                             return entry[8] + entry[9]
                     return 0
                 def flags(self, rev):
                     """Return the flags of ``rev``: the low 16 bits of the first index field."""
                     entry = self.index[rev]
                     return entry[0] & 0xFFFF
                 def length(self, rev):
                     """Return index field 1 of ``rev`` (the length that ``end`` adds to ``start``)."""
                     entry = self.index[rev]
                     return entry[1]
                 def sidedata_length(self, rev):
                     """Return index field 9 of ``rev``, or 0 when ``self.hassidedata`` is false."""
                     return self.index[rev][9] if self.hassidedata else 0
                 def rawsize(self, rev):
                     """return the length of the uncompressed text for a given revision"""
                     stored = self.index[rev][2]
                     if stored < 0:
                         # No usable size in the index: measure the raw data itself.
                         return len(self.rawdata(rev))
                     return stored
                 def size(self, rev):
                     """length of non-raw text (processed by a "read" flag processor)"""
                     flags = self.flags(rev)
                     # Every known flag except ELLIPSIS, which is known to not change the
                     # content.
                     content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
                     if flags & content_changing:
                         return len(self.revision(rev))
                     # fast path: no "read" flag processor could change the content, so
                     # size is rawsize.
                     return self.rawsize(rev)
                 def fast_rank(self, rev):
                     """Return the rank of a revision if already known, or None otherwise.

                     The rank of a revision is the size of the sub-graph it defines as a
                     head. Equivalently, the rank of a revision `r` is the size of the set
                     `ancestors(r)`, `r` included.

                     This method returns the rank retrieved from the revlog in constant
                     time. It makes no attempt at computing unknown values for versions of
                     the revlog which do not persist the rank.
                     """
                     stored = self.index[rev][ENTRY_RANK]
                     if self._format_version != CHANGELOGV2:
                         return None
                     if stored == RANK_UNKNOWN:
                         return None
                     if rev == nullrev:
                         return 0  # convention
                     return stored
                 def chainbase(self, rev):
                     """Return the revision at the bottom of ``rev``'s delta chain.

                     Follows index field 3 until reaching an entry that points to
                     itself; the answer is memoized in ``self._chainbasecache``.
                     """
                     cache = self._chainbasecache
                     cached = cache.get(rev)
                     if cached is not None:
                         return cached
                     index = self.index
                     current = rev
                     while True:
                         below = index[current][3]
                         if below == current:
                             break
                         current = below
                     cache[rev] = current
                     return current
                 def linkrev(self, rev):
                     """Return index field 4 of ``rev``."""
                     entry = self.index[rev]
                     return entry[4]
                 def parentrevs(self, rev):
                     """Return the two parent revision numbers of ``rev``.

                     With ``canonical_parent_order`` set, a null first parent is moved
                     to the second position.  Raises ``error.WdirUnsupported`` when the
                     index lookup fails for ``wdirrev``.
                     """
                     try:
                         entry = self.index[rev]
                     except IndexError:
                         if rev == wdirrev:
                             raise error.WdirUnsupported
                         raise
                     first, second = entry[5], entry[6]
                     if self.canonical_parent_order and first == nullrev:
                         return second, first
                     return first, second
                 # fast parentrevs(rev) where rev isn't filtered
                 #
                 # This binds the very same function under a second name.
                 # NOTE(review): presumably subclasses that filter revisions override
                 # ``parentrevs`` and keep this alias as the unchecked variant -- confirm.
                 _uncheckedparentrevs = parentrevs
                 def node(self, rev):
                     """Return the node id stored in index field 7 of ``rev``.

                     Raises ``error.WdirUnsupported`` when the index lookup fails for
                     ``wdirrev``; any other ``IndexError`` is propagated.
                     """
                     try:
                         entry = self.index[rev]
                         return entry[7]
                     except IndexError:
                         if rev != wdirrev:
                             raise
                         raise error.WdirUnsupported
                 # Derived from index values.
                 def end(self, rev):
                     """Return ``start(rev) + length(rev)``."""
                     begin = self.start(rev)
                     return begin + self.length(rev)
                 def parents(self, node):
                     """Return the two parent nodes ``(p1, p2)`` of ``node``.

                     With ``canonical_parent_order`` set, a null first parent is moved
                     to the second position, matching what ``parentrevs`` does for
                     revision numbers.

                     Raises whatever ``self.rev(node)`` raises for an unknown node.
                     """
                     index = self.index
                     entry = index[self.rev(node)]
                     # inline node() to avoid function call overhead
                     p1 = index[entry[5]][7]
                     p2 = index[entry[6]][7]
                     # entry[5] holds a revision number, so comparing it with nullid (a
                     # node id) could never match; compare the parent *node* instead.
                     if self.canonical_parent_order and p1 == self.nullid:
                         return p2, p1
                     return p1, p2
                 def chainlen(self, rev):
                     """Return the first item of ``_chaininfo(rev)``: the chain length."""
                     info = self._chaininfo(rev)
                     return info[0]
                 def _chaininfo(self, rev):
                     """Return ``(chain-length, sum-delta-length)`` for ``rev``.

                     The delta chain is walked from ``rev`` down to its base, counting
                     the hops and summing index field 1 of every entry on the way.
                     Results are memoized in ``self._chaininfocache``, and a cached
                     value met during the walk is reused instead of walking further.
                     """
                     chaininfocache = self._chaininfocache
                     if rev in chaininfocache:
                         return chaininfocache[rev]
                     index = self.index
                     generaldelta = self.delta_config.general_delta
                     iterrev = rev
                     e = index[iterrev]
                     clen = 0
                     compresseddeltalen = 0
                     # An entry whose field 3 is its own revision is the chain base.
                     while iterrev != e[3]:
                         clen += 1
                         compresseddeltalen += e[1]
                         # With general delta the next link is named by field 3,
                         # otherwise it is simply the previous revision.
                         if generaldelta:
                             iterrev = e[3]
                         else:
                             iterrev -= 1
                         if iterrev in chaininfocache:
                             # The rest of the chain is already known: add it and stop.
                             t = chaininfocache[iterrev]
                             clen += t[0]
                             compresseddeltalen += t[1]
                             break
                         e = index[iterrev]
                     else:
                         # Only reached when the loop ended without ``break``, i.e. the
                         # walk went all the way down to the base.
                         # Add text length of base since decompressing that also takes
                         # work. For cache hits the length is already included.
                         compresseddeltalen += e[1]
                     r = (clen, compresseddeltalen)
                     chaininfocache[rev] = r
                     return r
                 def _deltachain(self, rev, stoprev=None):
                     """Obtain the delta chain for a revision.
                     ``stoprev`` specifies a revision to stop at. If not specified, we
                     stop at the base of the chain.
                     Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
                     revs in ascending order and ``stopped`` is a bool indicating whether
                     ``stoprev`` was hit.
                     """
                     generaldelta = self.delta_config.general_delta
                     # Try C implementation.
                     try:
                         return self.index.deltachain(rev, stoprev, generaldelta)
                     except AttributeError:
                         pass
                     chain = []
                     # Alias to prevent attribute lookup in tight loop.
                     index = self.index
                     iterrev = rev
                     e = index[iterrev]
                     while iterrev != e[3] and iterrev != stoprev:
                         chain.append(iterrev)
                         if generaldelta:
                             iterrev = e[3]
                         else:
                             iterrev -= 1
                         e = index[iterrev]
                     if iterrev == stoprev:
                         stopped = True
                     else:
                         chain.append(iterrev)
                         stopped = False
                     chain.reverse()
                     return chain, stopped
                 def ancestors(self, revs, stoprev=0, inclusive=False):
                     """Generate the ancestors of 'revs' in reverse revision order.
                     Does not generate revs lower than stoprev.

                     See the documentation for ancestor.lazyancestors for more details."""
                     # first, make sure start revisions aren't filtered
                     revs = list(revs)
                     for r in revs:
                         self.node(r)
                     # and we're sure ancestors aren't filtered as well
                     if rustancestor is None or not self.index.rust_ext_compat:
                         return ancestor.lazyancestors(
                             self._uncheckedparentrevs,
                             revs,
                             stoprev=stoprev,
                             inclusive=inclusive,
                         )
                     return rustancestor.LazyAncestors(
                         self.index, revs, stoprev=stoprev, inclusive=inclusive
                     )
                 def descendants(self, revs):
                     """Return the descendants of ``revs`` as computed by ``dagop.descendantrevs``."""
                     all_revs = self.revs
                     parents_of = self.parentrevs
                     return dagop.descendantrevs(revs, all_revs, parents_of)
                 def findcommonmissing(self, common=None, heads=None):
                     """Return a tuple of the ancestors of common and the ancestors of heads
                     that are not ancestors of common. In revset terminology, we return the
                     tuple:

                       ::common, (::heads) - (::common)

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()

                     common = [self.rev(n) for n in common]
                     heads = [self.rev(n) for n in heads]

                     # we want the ancestors, but inclusive
                     class lazyset:
                         """Set-like view: explicitly added values plus a lazy collection."""

                         def __init__(self, lazyvalues):
                             self.addedvalues = set()
                             self.lazyvalues = lazyvalues

                         def __contains__(self, value):
                             return value in self.addedvalues or value in self.lazyvalues

                         def __iter__(self):
                             added = self.addedvalues
                             yield from added
                             for r in self.lazyvalues:
                                 if r not in added:
                                     yield r

                         def add(self, value):
                             self.addedvalues.add(value)

                         def update(self, values):
                             self.addedvalues.update(values)

                     has = lazyset(self.ancestors(common))
                     has.add(nullrev)
                     has.update(common)

                     # take all ancestors from heads that aren't in has
                     missing = set()
                     pending = collections.deque(r for r in heads if r not in has)
                     while pending:
                         r = pending.popleft()
                         if r in missing:
                             continue
                         missing.add(r)
                         pending.extend(p for p in self.parentrevs(r) if p not in has)
                     return has, [self.node(miss) for miss in sorted(missing)]
                 def incrementalmissingrevs(self, common=None):
                     """Return an object that can be used to incrementally compute the
                     revision numbers of the ancestors of arbitrary sets that are not
                     ancestors of common. This is an ancestor.incrementalmissingancestors
                     object.

                     'common' is a list of revision numbers. If common is not supplied, uses
                     nullrev.
                     """
                     bases = [nullrev] if common is None else common
                     if rustancestor is None or not self.index.rust_ext_compat:
                         return ancestor.incrementalmissingancestors(self.parentrevs, bases)
                     return rustancestor.MissingAncestors(self.index, bases)
                 def findmissingrevs(self, common=None, heads=None):
                     """Return the revision numbers of the ancestors of heads that
                     are not ancestors of common.

                     More specifically, return a list of revision numbers corresponding to
                     nodes N such that every N satisfies the following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of revision numbers.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullrev."""
                     bases = [nullrev] if common is None else common
                     tips = self.headrevs() if heads is None else heads
                     return self.incrementalmissingrevs(common=bases).missingancestors(tips)
                 def findmissing(self, common=None, heads=None):
                     """Return the ancestors of heads that are not ancestors of common.

                     More specifically, return a list of nodes N such that every N
                     satisfies the following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()

                     # Work on revision numbers, then translate the answer back.
                     commonrevs = [self.rev(n) for n in common]
                     headrevs = [self.rev(n) for n in heads]

                     inc = self.incrementalmissingrevs(common=commonrevs)
                     missingrevs = inc.missingancestors(headrevs)
                     return [self.node(r) for r in missingrevs]
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a topological path from 'roots' to 'heads'.

                     Return a tuple (nodes, outroots, outheads) where 'nodes' is a
                     topologically sorted list of all nodes N that satisfy both of
                     these constraints:

                       1. N is a descendant of some node in 'roots'
                       2. N is an ancestor of some node in 'heads'

                     Every node is considered to be both a descendant and an ancestor
                     of itself, so every reachable node in 'roots' and 'heads' will be
                     included in 'nodes'.

                     'outroots' is the list of reachable nodes in 'roots', i.e., the
                     subset of 'roots' that is returned in 'nodes'.  Likewise,
                     'outheads' is the subset of 'heads' that is also in 'nodes'.

                     'roots' and 'heads' are both lists of node IDs.  If 'roots' is
                     unspecified, uses nullid as the only root.  If 'heads' is
                     unspecified, uses list of all of the revlog's heads."""
                     # Value returned whenever the answer is known to be empty.
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [self.nullid]  # Everybody's a descendant of nullid
                         lowestrev = nullrev
                     if (lowestrev == nullrev) and (heads is None):
                         # We want _all_ the nodes!
                         return (
                             [self.node(r) for r in self],
                             [self.nullid],
                             list(self.heads()),
                         )
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = len(self) - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = set()
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, False)
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = set(heads)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == self.nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendant of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors.add(n)  # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.update(
                                         [p for p in self.parents(n) if p != self.nullid]
                                     )
                                 elif n in heads:  # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > nullrev:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [root for root in roots if root in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(root) for root in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = nullrev
                             roots = [self.nullid]
                     # Transform our roots list into a set.
                     descendants = set(roots)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendants.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descendants, empty parents will look like
                     # they're descendants.
                     for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
                         n = self.node(r)
                         isdescendant = False
                         if lowestrev == nullrev:  # Everybody is a descendant of nullid
                             isdescendant = True
                         elif n in descendants:
                             # n is already a descendant
                             isdescendant = True
                             # This check only needs to be done here because all the roots
                             # were marked as descendants before the loop started.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendants, it's not a root.
                                 if (p[0] in descendants) or (p[1] in descendants):
                                     roots.remove(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendant if either of its parents are
                             # descendants.  (We seeded the descendants set with the roots
                             # up there, remember?)
                             if (p[0] in descendants) or (p[1] in descendants):
                                 descendants.add(n)
                                 isdescendant = True
                         if isdescendant and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendants and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = True
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = True
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     # Keep only the heads that were actually reached (flag set to True).
                     heads = [head for head, flag in heads.items() if flag]
                     roots = list(roots)
                     # The three results are expected to be non-empty by this point.
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def headrevs(self, revs=None):
                     """Return head revision numbers, of the whole revlog or of ``revs``.

                     Without ``revs`` the index's own ``headrevs`` is used when it has
                     one, falling back to ``self._headrevs()``.  With ``revs`` the work
                     is delegated to ``rustdagop`` or ``dagop``.
                     """
                     if revs is not None:
                         if rustdagop is not None and self.index.rust_ext_compat:
                             return rustdagop.headrevs(self.index, revs)
                         return dagop.headrevs(revs, self._uncheckedparentrevs)
                     try:
                         return self.index.headrevs()
                     except AttributeError:
                         return self._headrevs()
                 def computephases(self, roots):
                     """Return what the index's ``computephasesmapsets(roots)`` returns."""
                     index = self.index
                     return index.computephasesmapsets(roots)
                 def _headrevs(self):
                     """Compute head revisions by scanning every revision of ``self``.

                     Returns ``[nullrev]`` when the revlog is empty, otherwise the list of
                     revisions that no iterated revision names as a parent.
                     """
                     total = len(self)
                     if total == 0:
                         return [nullrev]
                     # Revisions skipped by iteration keep a 0 flag, so they never show up
                     # as heads. One extra slot is allocated past the last revision
                     # (presumably to absorb writes for a null parent index).
                     flags = [0] * (total + 1)
                     entries = self.index
                     for rev in self:
                         # a revision is a head until something lists it as a parent
                         flags[rev] = 1
                         entry = entries[rev]
                         flags[entry[5]] = 0
                         flags[entry[6]] = 0
                     return [rev for rev, flag in enumerate(flags) if flag]
                 def heads(self, start=None, stop=None):
                     """Return the list of all nodes that have no children.

                     If ``start`` is given, only heads that are descendants of ``start``
                     are returned. If ``stop`` is given, every revision listed in it is
                     treated as if it had no children.
                     """
                     if start is None and stop is None:
                         if len(self) == 0:
                             return [self.nullid]
                         return [self.node(r) for r in self.headrevs()]
                     startrev = nullrev if start is None else self.rev(start)
                     stoprevs = {self.rev(n) for n in stop or []}
                     headrevs = dagop.headrevssubset(
                         self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
                     )
                     return [self.node(rev) for rev in headrevs]
                 def children(self, node):
                     """Return the nodes of every revision that has ``node`` as a parent.

                     Only revisions after ``node``'s own revision are examined. A revision
                     whose parents are all ``nullrev`` counts as a child only when ``node``
                     itself resolves to ``nullrev``.
                     """
                     target = self.rev(node)
                     found = []
                     for r in self.revs(start=target + 1):
                         realparents = [pr for pr in self.parentrevs(r) if pr != nullrev]
                         if not realparents:
                             if target == nullrev:
                                 found.append(self.node(r))
                             continue
                         for pr in realparents:
                             if pr == target:
                                 found.append(self.node(r))
                     return found
                 def commonancestorsheads(self, a, b):
                     """Return the nodes heading the common ancestors of nodes a and b."""
                     reva = self.rev(a)
                     revb = self.rev(b)
                     headrevs = self._commonancestorsheads(reva, revb)
                     return pycompat.maplist(self.node, headrevs)
                 def _commonancestorsheads(self, *revs):
                     """Return the heads of the common ancestors of ``revs`` (revisions).

                     The index implementation is tried first; on ``AttributeError`` or
                     ``OverflowError`` the ``ancestor`` module is used instead.
                     """
                     try:
                         return self.index.commonancestorsheads(*revs)
                     except (AttributeError, OverflowError):
                         # C implementation failed
                         return ancestor.commonancestorsheads(self.parentrevs, *revs)
                 def isancestor(self, a, b):
                     """Tell whether node ``a`` is an ancestor of node ``b``.

                     A revision is considered an ancestor of itself.
                     """
                     reva = self.rev(a)
                     revb = self.rev(b)
                     return self.isancestorrev(reva, revb)
                 def isancestorrev(self, a, b):
                     """Tell whether revision ``a`` is an ancestor of revision ``b``.

                     A revision is considered an ancestor of itself. The cheap cases are
                     settled by comparison; everything else is delegated to
                     ``reachableroots``.
                     """
                     if a == nullrev or a == b:
                         return True
                     if a > b:
                         # a revision numbered after b is never reported as its ancestor
                         return False
                     found = self.reachableroots(a, [b], [a], includepath=False)
                     return bool(found)
                 def reachableroots(self, minroot, heads, roots, includepath=False):
                     """Return (heads(::(<roots> and <roots>::<heads>))).

                     If ``includepath`` is True, return (<roots>::<heads>).
                     """
                     try:
                         native = self.index.reachableroots2
                         return native(minroot, heads, roots, includepath)
                     except AttributeError:
                         # no index-level implementation; note the pure helper takes
                         # roots before heads
                         return dagop._reachablerootspure(
                             self.parentrevs, minroot, roots, heads, includepath
                         )
                 def ancestor(self, a, b):
                     """Return the "best" common ancestor of nodes ``a`` and ``b``.

                     When several candidates exist the smallest node wins, so the answer
                     is stable. ``self.nullid`` is returned when there is no candidate.
                     """
                     reva, revb = self.rev(a), self.rev(b)
                     try:
                         candidates = self.index.ancestors(reva, revb)
                     except (AttributeError, OverflowError):
                         candidates = ancestor.ancestors(self.parentrevs, reva, revb)
                     if not candidates:
                         return self.nullid
                     # choose a consistent winner when there's a tie
                     return min(self.node(r) for r in candidates)
                 def _match(self, id):
                     """Resolve ``id`` when it exactly designates a revision.

                     The following interpretations are tried in order:

                     - an ``int`` revision number;
                     - a binary node of ``self.nodeconstants.nodelen`` bytes;
                     - the canonical decimal text of a revision number, where negative
                       values count back from ``len(self)``;
                     - a full hex node id of ``2 * nodelen`` characters.

                     Returns the binary node on success. When nothing matches, the
                     function falls off the end and therefore returns None.
                     """
                     if isinstance(id, int):
                         # rev
                         return self.node(id)
                     if len(id) == self.nodeconstants.nodelen:
                         # possibly a binary node
                         # odds of a binary node being all hex in ASCII are 1 in 10**25
                         try:
                             node = id
                             self.rev(node)  # quick search the index
                             return node
                         except error.LookupError:
                             pass  # may be partial hex id
                     try:
                         # str(rev)
                         rev = int(id)
                         # reject non-canonical spellings that int() would accept
                         if b"%d" % rev != id:
                             raise ValueError
                         if rev < 0:
                             rev = len(self) + rev
                         if rev < 0 or rev >= len(self):
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         pass
                     if len(id) == 2 * self.nodeconstants.nodelen:
                         try:
                             # a full hex nodeid?
                             node = bin(id)
                             self.rev(node)
                             return node
                         except (binascii.Error, error.LookupError):
                             pass
                 def _partialmatch(self, id):
                     """Resolve a hex prefix ``id`` to a node.

                     The index's ``partialmatch`` is tried first; when it is unavailable,
                     rejects the key, or reports several matches on a revlog that has
                     ``filteredrevs``, a linear scan over the index is used instead.
                     Results of that scan are remembered in ``self._pcache``.

                     Returns the matching node, or None when nothing matches.

                     Raises ``error.AmbiguousPrefixLookupError`` when several nodes match
                     or when a single match is also a prefix of the wdir hex id, and
                     ``error.WdirUnsupported`` when only the wdir hex id matches.
                     """
                     # we don't care wdirfilenodeids as they should be always full hash
                     maybewdir = self.nodeconstants.wdirhex.startswith(id)
                     ambiguous = False
                     try:
                         partial = self.index.partialmatch(id)
                         if partial and self.hasnode(partial):
                             if maybewdir:
                                 # single 'ff...' match in radix tree, ambiguous with wdir
                                 ambiguous = True
                             else:
                                 return partial
                         elif maybewdir:
                             # no 'ff...' match in radix tree, wdir identified
                             raise error.WdirUnsupported
                         else:
                             return None
                     except error.RevlogError:
                         # parsers.c radix tree lookup gave multiple matches
                         # fast path: for unfiltered changelog, radix tree is accurate
                         if not getattr(self, 'filteredrevs', None):
                             ambiguous = True
                         # fall through to slow path that filters hidden revisions
                     except (AttributeError, ValueError):
                         # we are pure python, or key is not hex
                         pass
                     if ambiguous:
                         raise error.AmbiguousPrefixLookupError(
                             id, self.display_id, _(b'ambiguous identifier')
                         )
                     # slow path: consult the prefix cache, then scan the whole index
                     if id in self._pcache:
                         return self._pcache[id]
                     if len(id) <= 40:
                         # hex(node)[:...]
                         l = len(id) // 2 * 2  # grab an even number of digits
                         try:
                             # we're dropping the last digit, so let's check that it's hex,
                             # to avoid the expensive computation below if it's not
                             if len(id) % 2 > 0:
                                 if not (id[-1] in hexdigits):
                                     return None
                             prefix = bin(id[:l])
                         except binascii.Error:
                             pass
                         else:
                             # first filter on the binary prefix, then confirm against the
                             # full hex prefix (which may carry one extra digit)
                             nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                             nl = [
                                 n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                             ]
                             if self.nodeconstants.nullhex.startswith(id):
                                 nl.append(self.nullid)
                             if len(nl) > 0:
                                 if len(nl) == 1 and not maybewdir:
                                     self._pcache[id] = nl[0]
                                     return nl[0]
                                 raise error.AmbiguousPrefixLookupError(
                                     id, self.display_id, _(b'ambiguous identifier')
                                 )
                             if maybewdir:
                                 raise error.WdirUnsupported
                             return None
                 def lookup(self, id):
                     """Locate a node from one of:

                     - a revision number or str(revision number)
                     - a nodeid or a prefix of a hex nodeid

                     Raises ``error.LookupError`` when neither an exact nor a partial
                     match is found.
                     """
                     node = self._match(id)
                     if node is None:
                         node = self._partialmatch(id)
                         if not node:
                             raise error.LookupError(
                                 id, self.display_id, _(b'no match found')
                             )
                     return node
                 def shortest(self, node, minlength=1):
                     """Find the shortest unambiguous prefix that matches node.

                     ``minlength`` is the smallest prefix length considered. The returned
                     prefix is lengthened as needed so that it does not consist solely of
                     ``f`` characters (which could be read as a prefix of the wdir id),
                     except when ``node`` is the wdir id itself.

                     Raises ``error.LookupError`` when ``node`` is not found.
                     """

                     def isvalid(prefix):
                         # True when ``prefix`` is unambiguous, False when it is ambiguous;
                         # raises LookupError when it matches nothing at all.
                         try:
                             matchednode = self._partialmatch(prefix)
                         except error.AmbiguousPrefixLookupError:
                             return False
                         except error.WdirUnsupported:
                             # single 'ff...' match
                             return True
                         if matchednode is None:
                             raise error.LookupError(node, self.display_id, _(b'no node'))
                         return True

                     def maybewdir(prefix):
                         # a prefix made only of 'f' characters
                         return all(c == b'f' for c in pycompat.iterbytestr(prefix))

                     hexnode = hex(node)

                     def disambiguate(hexnode, minlength):
                         """Disambiguate against wdirid."""
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if not maybewdir(prefix):
                                 return prefix

                     # fast path: ask the index directly when nothing is filtered
                     if not getattr(self, 'filteredrevs', None):
                         try:
                             length = max(self.index.shortest(node), minlength)
                             return disambiguate(hexnode, length)
                         except error.RevlogError:
                             if node != self.nodeconstants.wdirid:
                                 raise error.LookupError(
                                     node, self.display_id, _(b'no node')
                                 )
                         except AttributeError:
                             # Fall through to pure code
                             pass
                     if node == self.nodeconstants.wdirid:
                         # the wdir id is allowed to keep an all-'f' prefix
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if isvalid(prefix):
                                 return prefix
                     # slow path: grow the prefix until it is unambiguous
                     for length in range(minlength, len(hexnode) + 1):
                         prefix = hexnode[:length]
                         if isvalid(prefix):
                             return disambiguate(hexnode, length)
                 def cmp(self, node, text):
                     """Compare ``text`` with a given file revision.

                     Returns True if ``text`` is different than what is stored, judged by
                     hashing ``text`` with the parents of ``node``.
                     """
                     parent1, parent2 = self.parents(node)
                     expected = storageutil.hashrevisionsha1(text, parent1, parent2)
                     return expected != node
                 def _getsegmentforrevs(self, startrev, endrev):
                     """Obtain a segment of raw data corresponding to a range of revisions.
                     Accepts the start and end revisions and an optional already-open
                     file handle to be used for reading. If the file handle is read, its
                     seek position will not be preserved.
                     Requests for data may be satisfied by a cache.
                     Returns a 2-tuple of (offset, data) for the requested range of
                     revisions. Offset is the integer offset from the beginning of the
                     revlog and data is a str or buffer of the raw byte data.
                     Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
                     to determine where each revision's data begins and ends.
                     """
                     # Inlined self.start(startrev) & self.end(endrev) for perf reasons
                     # (functions are expensive).
                     index = self.index
                     istart = index[startrev]
                     start = int(istart[0] >> 16)
                     if startrev == endrev:
                         end = start + istart[1]
                     else:
                         iend = index[endrev]
                         end = int(iend[0] >> 16) + iend[1]
                     if self._inline:
                         start += (startrev + 1) * self.index.entry_size
                         end += (endrev + 1) * self.index.entry_size
                     length = end - start
                     return start, self._segmentfile.read_chunk(start, length)
                 def _chunk(self, rev):
                     """Obtain a single decompressed chunk for a revision.

                     Accepts an integer revision. The stored bytes are returned as-is or
                     decompressed according to the compression mode recorded in the index
                     entry.

                     Raises ``error.RevlogError`` on an unknown compression mode.
                     """
                     mode = self.index[rev][10]
                     segment = self._getsegmentforrevs(rev, rev)[1]
                     if mode == COMP_MODE_PLAIN:
                         return segment
                     if mode == COMP_MODE_DEFAULT:
                         return self._decompressor(segment)
                     if mode == COMP_MODE_INLINE:
                         return self.decompress(segment)
                     msg = b'unknown compression mode %d'
                     msg %= mode
                     raise error.RevlogError(msg)
                 def _chunks(self, revs, targetsize=None):
                     """Obtain decompressed chunks for the specified revisions.

                     Accepts an iterable of numeric revisions that are assumed to be in
                     ascending order. ``targetsize`` is only forwarded to
                     ``deltautil.slicechunk`` when sparse reading is enabled.

                     This function is similar to calling ``self._chunk()`` multiple times,
                     but is faster.

                     Returns a list with decompressed data for each requested revision.
                     Raises ``error.RevlogError`` on an unknown compression mode.
                     """
                     if not revs:
                         return []
                     # bind frequently used attributes to locals for the loops below
                     start = self.start
                     length = self.length
                     inline = self._inline
                     iosize = self.index.entry_size
                     buffer = util.buffer
                     l = []
                     ladd = l.append
                     if not self._withsparseread:
                         # read everything as a single slice
                         slicedchunks = (revs,)
                     else:
                         slicedchunks = deltautil.slicechunk(
                             self, revs, targetsize=targetsize
                         )
                     for revschunk in slicedchunks:
                         firstrev = revschunk[0]
                         # Skip trailing revisions with empty diff
                         for lastrev in revschunk[::-1]:
                             if length(lastrev) != 0:
                                 break
                         try:
                             offset, data = self._getsegmentforrevs(firstrev, lastrev)
                         except OverflowError:
                             # issue4215 - we can't cache a run of chunks greater than
                             # 2G on Windows
                             # NOTE(review): this returns only the chunks of the current
                             # slice; anything gathered from earlier slices is dropped.
                             # Confirm this is intended.
                             return [self._chunk(rev) for rev in revschunk]
                         decomp = self.decompress
                         # self._decompressor might be None, but will not be used in that case
                         def_decomp = self._decompressor
                         for rev in revschunk:
                             chunkstart = start(rev)
                             if inline:
                                 # account for the index entries interleaved with the data
                                 chunkstart += (rev + 1) * iosize
                             chunklength = length(rev)
                             comp_mode = self.index[rev][10]
                             # view on this revision's bytes inside the segment just read
                             c = buffer(data, chunkstart - offset, chunklength)
                             if comp_mode == COMP_MODE_PLAIN:
                                 ladd(c)
                             elif comp_mode == COMP_MODE_INLINE:
                                 ladd(decomp(c))
                             elif comp_mode == COMP_MODE_DEFAULT:
                                 ladd(def_decomp(c))
                             else:
                                 msg = b'unknown compression mode %d'
                                 msg %= comp_mode
                                 raise error.RevlogError(msg)
                     return l
                 def deltaparent(self, rev):
                     """Return the revision that ``rev`` is stored as a delta against.

                     ``nullrev`` is returned when the index entry names ``rev`` as its own
                     base. Otherwise the recorded base is returned under general delta,
                     and ``rev - 1`` when general delta is off.
                     """
                     base = self.index[rev][3]
                     if base == rev:
                         return nullrev
                     if self.delta_config.general_delta:
                         return base
                     return rev - 1
                 def issnapshot(self, rev):
                     """Tell whether ``rev`` is a snapshot.

                     Without sparse-revlog, a snapshot is a revision whose delta parent
                     is ``nullrev``. With it, the index's own ``issnapshot`` is preferred
                     when present; otherwise a revision is a snapshot when it has no
                     delta base, or when its base is neither of its (non-empty) parents
                     and that base is itself a snapshot.
                     """
                     if not self._sparserevlog:
                         return self.deltaparent(rev) == nullrev
                     if hasattr(self.index, 'issnapshot'):
                         # directly assign the method to cache the testing and access
                         self.issnapshot = self.index.issnapshot
                         return self.issnapshot(rev)
                     if rev == nullrev:
                         return True
                     entry = self.index[rev]
                     base = entry[3]
                     if base == rev or base == nullrev:
                         return True

                     def skipempty(parent):
                         # walk past revisions with zero stored length to the revision
                         # they are a delta against
                         while self.length(parent) == 0:
                             deltabase = self.deltaparent(parent)
                             if deltabase == parent:
                                 break
                             parent = deltabase
                         return parent

                     p1 = skipempty(entry[5])
                     p2 = skipempty(entry[6])
                     if base == p1 or base == p2:
                         # a delta against a parent is a regular delta, not a snapshot
                         return False
                     return self.issnapshot(base)
                 def snapshotdepth(self, rev):
                     """Return the number of snapshots in the chain before ``rev``.

                     Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
                     """
                     if not self.issnapshot(rev):
                         # interpolate the revision; the message used to carry a raw '%d'
                         raise error.ProgrammingError(
                             b'revision %d not a snapshot' % rev
                         )
                     return len(self._deltachain(rev)[0]) - 1
                 def revdiff(self, rev1, rev2):
                     """Return or calculate a delta between two revisions.

                     The delta is in binary form and is intended to be written to revlog
                     data directly, so it is built from raw revision data. When ``rev2``
                     is already stored as a delta against ``rev1``, the stored chunk is
                     returned instead of computing a new diff.
                     """
                     stored = rev1 != nullrev and self.deltaparent(rev2) == rev1
                     if stored:
                         return bytes(self._chunk(rev2))
                     oldraw = self.rawdata(rev1)
                     newraw = self.rawdata(rev2)
                     return mdiff.textdiff(oldraw, newraw)
                 def revision(self, nodeorrev):
                     """Return the uncompressed revision for a node or revision number."""
                     text = self._revisiondata(nodeorrev)
                     return text
                 def sidedata(self, nodeorrev):
                     """Return a map of extra data related to the changeset but not part
                     of the hash.

                     This currently returns a dictionary. However, a more advanced
                     mapping object will likely be used in the future for more
                     efficient/lazy code.
                     """
                     # accept either a revision number or a node
                     rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
                     return self._sidedata(rev)
                 def _revisiondata(self, nodeorrev, raw=False):
                     """Return the text of a revision given as a node or revision number.

                     With ``raw`` set, the text as stored in the revlog is returned (flag
                     processors are only consulted through ``processflagsraw``);
                     otherwise ``processflagsread`` transforms the stored text. The hash
                     is checked when the flag processing asks for it, and a freshly
                     built rawtext is stored in ``self._revisioncache``.
                     """
                     # deal with <nodeorrev> argument type
                     if isinstance(nodeorrev, int):
                         rev = nodeorrev
                         node = self.node(rev)
                     else:
                         node = nodeorrev
                         rev = None
                     # fast path the special `nullid` rev
                     if node == self.nullid:
                         return b""
                     # ``rawtext`` is the text as stored inside the revlog. Might be the
                     # revision or might need to be processed to retrieve the revision.
                     rev, rawtext, validated = self._rawtext(node, rev)
                     if raw and validated:
                         # if we don't want to process the raw text and that raw
                         # text is cached, we can exit early.
                         return rawtext
                     if rev is None:
                         rev = self.rev(node)
                     # the revlog's flag for this revision
                     # (usually alter its state or content)
                     flags = self.flags(rev)
                     if validated and flags == REVIDX_DEFAULT_FLAGS:
                         # no extra flags set, no flag processor runs, text = rawtext
                         return rawtext
                     if raw:
                         validatehash = flagutil.processflagsraw(self, rawtext, flags)
                         text = rawtext
                     else:
                         r = flagutil.processflagsread(self, rawtext, flags)
                         text, validatehash = r
                     if validatehash:
                         self.checkhash(text, node, rev=rev)
                     if not validated:
                         # the rawtext was rebuilt by _rawtext (which dropped the cache),
                         # so remember it now
                         self._revisioncache = (node, rev, rawtext)
                     return text
                 def _rawtext(self, node, rev):
                     """Return the possibly unvalidated rawtext for a revision.

                     ``rev`` may be None, in which case it is looked up from ``node``
                     unless the revision cache already holds ``node``.

                     Returns ``(rev, rawtext, validated)``. ``validated`` is True only
                     when the text came straight from ``self._revisioncache``; in that
                     case ``rev`` is returned as it was passed in (possibly None).
                     """
                     # revision in the cache (could be useful to apply delta)
                     cachedrev = None
                     # An intermediate text to apply deltas to
                     basetext = None
                     # Check if we have the entry in cache
                     # The cache entry looks like (node, rev, rawtext)
                     if self._revisioncache:
                         if self._revisioncache[0] == node:
                             return (rev, self._revisioncache[2], True)
                         cachedrev = self._revisioncache[1]
                     if rev is None:
                         rev = self.rev(node)
                     # stop walking the delta chain at the cached revision, if reached
                     chain, stopped = self._deltachain(rev, stoprev=cachedrev)
                     if stopped:
                         basetext = self._revisioncache[2]
                     # drop cache to save memory, the caller is expected to
                     # update self._revisioncache after validating the text
                     self._revisioncache = None
                     targetsize = None
                     rawsize = self.index[rev][2]
                     if 0 <= rawsize:
                         # only pass a read-size hint when the recorded size is usable
                         targetsize = 4 * rawsize
                     bins = self._chunks(chain, targetsize=targetsize)
                     if basetext is None:
                         # no cached base: the first chunk of the chain is the full text
                         basetext = bytes(bins[0])
                         bins = bins[1:]
                     rawtext = mdiff.patches(basetext, bins)
                     del basetext  # let us have a chance to free memory early
                     return (rev, rawtext, False)
                 def _sidedata(self, rev):
                     """Return the sidedata for a given revision number.

                     An empty dict is returned when the index records no sidedata for
                     ``rev``. Raises ``error.RevlogError`` when the recorded range extends
                     past the docket's ``sidedata_end`` or when the compression mode is
                     unknown.
                     """
                     entry = self.index[rev]
                     offset = entry[8]
                     size = entry[9]
                     if self._inline:
                         offset += self.index.entry_size * (1 + rev)
                     if size == 0:
                         return {}
                     available = self._docket.sidedata_end
                     if available < offset + size:
                         m = FILE_TOO_SHORT_MSG % (
                             self._sidedatafile,
                             size,
                             offset,
                             available,
                         )
                         raise error.RevlogError(m)
                     stored = self._segmentfile_sidedata.read_chunk(offset, size)
                     mode = self.index[rev][11]
                     if mode == COMP_MODE_PLAIN:
                         segment = stored
                     elif mode == COMP_MODE_DEFAULT:
                         segment = self._decompressor(stored)
                     elif mode == COMP_MODE_INLINE:
                         segment = self.decompress(stored)
                     else:
                         msg = b'unknown compression mode %d'
                         msg %= mode
                         raise error.RevlogError(msg)
                     return sidedatautil.deserialize_sidedata(segment)
                 def rawdata(self, nodeorrev):
                     """Return the uncompressed raw data of a node or revision number."""
                     rawtext = self._revisiondata(nodeorrev, raw=True)
                     return rawtext
                 def hash(self, text, p1, p2):
                     """Compute the node hash of ``text`` with parents ``p1`` and ``p2``.

                     Kept as a method so that subclasses can replace the hash as needed.
                     """
                     digest = storageutil.hashrevisionsha1(text, p1, p2)
                     return digest
                 def checkhash(self, text, node, p1=None, p2=None, rev=None):
                     """Check node hash integrity.

                     Available as a function so that subclasses can extend hash mismatch
                     behaviors as needed.

                     ``p1`` and ``p2`` are fetched through ``self.parents(node)`` when both
                     are None. ``rev`` is only used to label the error message; a short
                     form of the node is used when it is None.

                     Raises ``error.RevlogError`` when the hash does not match, or
                     ``error.CensoredNodeError`` when the revlog is censorable and ``text``
                     is censored content.
                     """
                     try:
                         if p1 is None and p2 is None:
                             p1, p2 = self.parents(node)
                         if node != self.hash(text, p1, p2):
                             # Clear the revision cache on hash failure. The revision cache
                             # only stores the raw revision and clearing the cache does have
                             # the side-effect that we won't have a cache hit when the raw
                             # revision data is accessed. But this case should be rare and
                             # it is extra work to teach the cache about the hash
                             # verification state.
                             if self._revisioncache and self._revisioncache[0] == node:
                                 self._revisioncache = None
                             revornode = rev
                             if revornode is None:
                                 revornode = templatefilters.short(hex(node))
                             raise error.RevlogError(
                                 _(b"integrity check failed on %s:%s")
                                 % (self.display_id, pycompat.bytestr(revornode))
                             )
                     except error.RevlogError:
                         # a censored revision is reported with a dedicated error
                         if self.feature_config.censorable and storageutil.iscensoredtext(
                             text
                         ):
                             raise error.CensoredNodeError(self.display_id, node, text)
                         raise
                 @property
                 def _split_index_file(self):
                     """the path where to expect the index of an ongoing splitting operation
                     The file will only exist if a splitting operation is in progress, but
                     it is always expected at the same location."""
                     parts = self.radix.split(b'/')
                     if len(parts) > 1:
                         # adds a '-s' prefix to the ``data/` or `meta/` base
                         head = parts[0] + b'-s'
                         mids = parts[1:-1]
                         tail = parts[-1] + b'.i'
                         pieces = [head] + mids + [tail]
                         return b'/'.join(pieces)
                     else:
                         # the revlog is stored at the root of the store (changelog or
                         # manifest), no risk of collision.
                         return self.radix + b'.i.s'
                 def _enforceinlinesize(self, tr, side_write=True):
                     """Check if the revlog is too big for inline and convert if so.

                     This should be called after revisions are added to the revlog. If the
                     revlog has grown too large to be an inline revlog, it will convert it
                     to use multiple index and data files.

                     ``tr`` is the running transaction. The index file must already be
                     registered in it, otherwise RevlogError is raised.

                     When ``side_write`` is true, the new index is written at the
                     ``_split_index_file`` location, registered as a temporary file of the
                     transaction, and only renamed over the real index when the
                     transaction is finalized.
                     """
                     tiprev = len(self) - 1
                     # amount of revision data stored so far (end of the tip revision)
                     total_size = self.start(tiprev) + self.length(tiprev)
                     # nothing to do if the revlog is already split or is still small
                     # enough to stay inline
                     if not self._inline or total_size < _maxinline:
                         return
                     troffset = tr.findoffset(self._indexfile)
                     if troffset is None:
                         raise error.RevlogError(
                             _(b"%s not found in the transaction") % self._indexfile
                         )
                     # NOTE(review): presumably a non-zero offset means the index already
                     # held data before this transaction, hence the backup -- confirm
                     # against the transaction implementation.
                     if troffset:
                         tr.addbackup(self._indexfile, for_offset=True)
                     # the data file is written from scratch below, track it from offset 0
                     tr.add(self._datafile, 0)
                     # remember whether we were called from within a writing context, so
                     # that fresh handles can be exposed again once the split is done
                     existing_handles = False
                     if self._writinghandles is not None:
                         existing_handles = True
                         fp = self._writinghandles[0]
                         fp.flush()
                         fp.close()
                         # We can't use the cached file handle after close(). So prevent
                         # its usage.
                         self._writinghandles = None
                         self._segmentfile.writing_handle = None
                         # No need to deal with sidedata writing handle as it is only
                         # relevant with revlog-v2 which is never inline, not reaching
                         # this code
                     if side_write:
                         old_index_file_path = self._indexfile
                         new_index_file_path = self._split_index_file
                         opener = self.opener
                         # the callbacks only hold a weak reference so that they do not
                         # keep this revlog alive until the end of the transaction
                         weak_self = weakref.ref(self)
                         # the "split" index replaces the real index when the transaction
                         # is finalized
                         def finalize_callback(tr):
                             opener.rename(
                                 new_index_file_path,
                                 old_index_file_path,
                                 checkambig=True,
                             )
                             maybe_self = weak_self()
                             if maybe_self is not None:
                                 maybe_self._indexfile = old_index_file_path
                         # on abort, only the in-memory index path is restored here
                         def abort_callback(tr):
                             maybe_self = weak_self()
                             if maybe_self is not None:
                                 maybe_self._indexfile = old_index_file_path
                         tr.registertmp(new_index_file_path)
                         # build a callback id out of the revlog target; the second item
                         # of the target may be None
                         if self.target[1] is not None:
                             callback_id = b'000-revlog-split-%d-%s' % self.target
                         else:
                             callback_id = b'000-revlog-split-%d' % self.target[0]
                         tr.addfinalize(callback_id, finalize_callback)
                         tr.addabort(callback_id, abort_callback)
                     new_dfh = self._datafp(b'w+')
                     new_dfh.truncate(0)  # drop any potentially existing data
                     try:
                         # copy the segment of every revision, in order, into the new
                         # data file
                         with self.reading():
                             for r in self:
                                 new_dfh.write(self._getsegmentforrevs(r, r)[1])
                             new_dfh.flush()
                         # from now on the index lives at the "split" location (if any)
                         if side_write:
                             self._indexfile = new_index_file_path
                         with self.__index_new_fp() as fp:
                             # the revlog stops being inline before the entries are
                             # re-serialized, so the header written below no longer
                             # carries the inline flag
                             self._format_flags &= ~FLAG_INLINE_DATA
                             self._inline = False
                             for i in self:
                                 e = self.index.entry_binary(i)
                                 # without a docket, the revlog header is stored in front
                                 # of the first index entry
                                 if i == 0 and self._docket is None:
                                     header = self._format_flags | self._format_version
                                     header = self.index.pack_header(header)
                                     e = header + e
                                 fp.write(e)
                             if self._docket is not None:
                                 self._docket.index_end = fp.tell()
                             # If we don't use side-write, the temp file replace the real
                             # index when we exit the context manager
                         nodemaputil.setup_persistent_nodemap(tr, self)
                         # data is now read from the standalone data file
                         self._segmentfile = randomaccessfile.randomaccessfile(
                             self.opener,
                             self._datafile,
                             self._chunkcachesize,
                         )
                         if existing_handles:
                             # switched from inline to conventional reopen the index
                             ifh = self.__index_write_fp()
                             self._writinghandles = (ifh, new_dfh, None)
                             self._segmentfile.writing_handle = new_dfh
                             # ownership of the data handle moved to the writing
                             # handles: keep the ``finally`` clause from closing it
                             new_dfh = None
                             # No need to deal with sidedata writing handle as it is only
                             # relevant with revlog-v2 which is never inline, not reaching
                             # this code
                     finally:
                         if new_dfh is not None:
                             new_dfh.close()
                 def _nodeduplicatecallback(self, transaction, node):
                     """called when trying to add a node already stored."""
                 @contextlib.contextmanager
                 def reading(self):
                     """Keep the data and sidedata files open for reading within the context."""
                     if not len(self.index):
                         # empty revlog: there is nothing to be read
                         yield
                         return
                     data_reader = self._segmentfile.reading()
                     with data_reader, self._segmentfile_sidedata.reading():
                         yield
                 @contextlib.contextmanager
                 def _writing(self, transaction):
                     if self._trypending:
                         msg = b'try to write in a `trypending` revlog: %s'
                         msg %= self.display_id
                         raise error.ProgrammingError(msg)
                     if self._writinghandles is not None:
                         yield
                     else:
                         ifh = dfh = sdfh = None
                         try:
                             r = len(self)
                             # opening the data file.
                             dsize = 0
                             if r:
                                 dsize = self.end(r - 1)
                             dfh = None
                             if not self._inline:
                                 try:
                                     dfh = self._datafp(b"r+")
                                     if self._docket is None:
                                         dfh.seek(0, os.SEEK_END)
                                     else:
                                         dfh.seek(self._docket.data_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     dfh = self._datafp(b"w+")
                                 transaction.add(self._datafile, dsize)
                             if self._sidedatafile is not None:
                                 # revlog-v2 does not inline, help Pytype
                                 assert dfh is not None
                                 try:
                                     sdfh = self.opener(self._sidedatafile, mode=b"r+")
                                     dfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     sdfh = self.opener(self._sidedatafile, mode=b"w+")
                                 transaction.add(
                                     self._sidedatafile, self._docket.sidedata_end
                                 )
                             # opening the index file.
                             isize = r * self.index.entry_size
                             ifh = self.__index_write_fp()
                             if self._inline:
                                 transaction.add(self._indexfile, dsize + isize)
                             else:
                                 transaction.add(self._indexfile, isize)
                             # exposing all file handle for writing.
                             self._writinghandles = (ifh, dfh, sdfh)
                             self._segmentfile.writing_handle = ifh if self._inline else dfh
                             self._segmentfile_sidedata.writing_handle = sdfh
                             yield
                             if self._docket is not None:
                                 self._write_docket(transaction)
                         finally:
                             self._writinghandles = None
                             self._segmentfile.writing_handle = None
                             self._segmentfile_sidedata.writing_handle = None
                             if dfh is not None:
                                 dfh.close()
                             if sdfh is not None:
                                 sdfh.close()
                             # closing the index file last to avoid exposing referent to
                             # potential unflushed data content.
                             if ifh is not None:
                                 ifh.close()
                 def _write_docket(self, transaction):
                     """write the current docket on disk
                     Exist as a method to help changelog to implement transaction logic
                     We could also imagine using the same transaction logic for all revlog
                     since docket are cheap."""
                     self._docket.write(transaction)
                 def addrevision(
                     self,
                     text,
                     transaction,
                     link,
                     p1,
                     p2,
                     cachedelta=None,
                     node=None,
                     flags=REVIDX_DEFAULT_FLAGS,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a revision to the log and return its revision number.

                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     cachedelta - an optional precomputed delta
                     node - nodeid of the revision; usually left unset and computed as
                         hash(text, p1, p2). Subclasses might use a different hashing
                         method (and override checkhash() in such case)
                     flags - the known flags to set on the revision
                     deltacomputer - an optional deltacomputer instance shared between
                         multiple calls
                     sidedata - optional sidedata (an empty dict is used when None); only
                         accepted non-empty if the revlog supports sidedata

                     If the node is already stored, its existing revision number is
                     returned and nothing is added.
                     """
                     if link == nullrev:
                         msg = _(b"attempted to add linkrev -1 to %s") % self.display_id
                         raise error.RevlogError(msg)
                     if sidedata is None:
                         sidedata = {}
                     elif sidedata and not self.hassidedata:
                         msg = _(b"trying to add sidedata to a revlog who don't support them")
                         raise error.ProgrammingError(msg)
                     # With flags set, the node has to be derived from the text as given
                     # by the caller, before the flag processors get to transform it.
                     if flags and not node:
                         node = self.hash(text, p1, p2)
                     stored, needs_check = flagutil.processflagswrite(self, text, flags)
                     # A provided cachedelta is meaningless once the flag processors
                     # changed the revision data.
                     if stored != text:
                         cachedelta = None
                     if len(stored) > _maxentrysize:
                         too_big = _(
                             b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                         )
                         raise error.RevlogError(too_big % (self.display_id, len(stored)))
                     if not node:
                         node = self.hash(stored, p1, p2)
                     known_rev = self.index.get_rev(node)
                     if known_rev is not None:
                         return known_rev
                     if needs_check:
                         self.checkhash(stored, node, p1=p1, p2=p2)
                     return self.addrawrevision(
                         stored,
                         transaction,
                         link,
                         p1,
                         p2,
                         node,
                         flags,
                         cachedelta=cachedelta,
                         deltacomputer=deltacomputer,
                         sidedata=sidedata,
                     )
                 def addrawrevision(
                     self,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     node,
                     flags,
                     cachedelta=None,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a raw revision whose flags, node and parents are already known.

                     Useful when reusing a revision that is not stored in this revlog
                     (ex: received over the wire, or read from an external bundle).

                     Returns whatever ``_addrevision`` returns.
                     """
                     with self._writing(transaction):
                         new_rev = self._addrevision(
                             node, rawtext, transaction, link, p1, p2, flags, cachedelta,
                             deltacomputer=deltacomputer,
                             sidedata=sidedata,
                         )
                         return new_rev
                 def compress(self, data):
                     """Generate a possibly-compressed representation of data.

                     Returns a ``(header, payload)`` pair of bytes.
                     """
                     if not data:
                         return b'', data
                     packed = self._compressor.compress(data)
                     if packed:
                         # The revlog compressor already put its header in the output.
                         return b'', packed
                     # Stored as-is: data starting with a NUL byte needs no marker, any
                     # other data gets the ``u`` header.
                     marker = b'' if data[0:1] == b'\0' else b'u'
                     return marker, data
                 def decompress(self, data):
                     """Decompress a revlog chunk.

                     The chunk is expected to start with a header identifying its format
                     type, which is used to route it to the appropriate decompressor.
                     """
                     if not data:
                         return data
                     # Revlogs are read far more often than they are written, and many
                     # chunks only take microseconds to decompress, so performance
                     # matters here.
                     #
                     # A few assumptions can be made about revlogs:
                     #
                     # 1) most chunks are compressed (as opposed to inline raw data);
                     # 2) decompressing *any* data is likely at least 10x slower than
                     #    returning raw inline data;
                     # 3) common and officially supported compression engines should be
                     #    prioritized.
                     #
                     # Hence the case to optimize for is "compressed data encoded with a
                     # common, officially supported engine", ahead of "raw data" and
                     # "data encoded by a less common or non-official engine". That is
                     # why the inline checks come first and the compengines lookup last.
                     #
                     # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
                     # compressed chunks. And this matters for changelog and manifest
                     # reads.
                     header = data[0:1]
                     if header == b'x':
                         try:
                             return _zlibdecompress(data)
                         except zlib.error as exc:
                             raise error.RevlogError(
                                 _(b'revlog decompress error: %s')
                                 % stringutil.forcebytestr(exc)
                             )
                     # '\0' is more common than 'u' so it is tested first.
                     if header == b'\0':
                         return data
                     if header == b'u':
                         return util.buffer(data, 1)
                     engine = self._get_decompressor(header)
                     return engine.decompress(data)
                 def _addrevision(
                     self,
                     node,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     flags,
                     cachedelta,
                     alwayscache=False,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """internal function to add revisions to the log

                     see addrevision for argument descriptions.

                     note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

                     if "deltacomputer" is not provided or None, a defaultdeltacomputer will
                     be used.

                     if "alwayscache" is true and no raw text is available once the delta
                     has been computed, the text is rebuilt through the delta computer so
                     that it can be stored in the revision cache.

                     Returns the revision number of the added revision.

                     Raises RevlogError when asked to add the null or a wdir revision, and
                     ProgrammingError when called outside of the `_writing` context.

                     invariants:
                     - rawtext is optional (can be None); if not set, cachedelta must be set.
                       if both are set, they must correspond to each other.
                     """
                     if node == self.nullid:
                         raise error.RevlogError(
                             _(b"%s: attempt to add null revision") % self.display_id
                         )
                     if (
                         node == self.nodeconstants.wdirid
                         or node in self.nodeconstants.wdirfilenodeids
                     ):
                         raise error.RevlogError(
                             _(b"%s: attempt to add wdir revision") % self.display_id
                         )
                     if self._writinghandles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     # the text is handed over in a one-item list and read back from it
                     # after the delta computation (see ``btext[0]`` below);
                     # NOTE(review): presumably so the delta computer can fill it in.
                     btext = [rawtext]
                     # ``curr`` is the revision number the new entry will get
                     curr = len(self)
                     prev = curr - 1
                     offset = self._get_data_offset(prev)
                     if self._concurrencychecker:
                         ifh, dfh, sdfh = self._writinghandles
                         # XXX no checking for the sidedata file
                         if self._inline:
                             # offset is "as if" it were in the .d file, so we need to add on
                             # the size of the entry metadata.
                             self._concurrencychecker(
                                 ifh, self._indexfile, offset + curr * self.index.entry_size
                             )
                         else:
                             # Entries in the .i are a consistent size.
                             self._concurrencychecker(
                                 ifh, self._indexfile, curr * self.index.entry_size
                             )
                             self._concurrencychecker(dfh, self._datafile, offset)
                     # parents are stored in the index as revision numbers
                     p1r, p2r = self.rev(p1), self.rev(p2)
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if rawtext is None:
                         # need rawtext size, before changed by flag processors, which is
                         # the non-raw size. use revlog explicitly to avoid filelog's extra
                         # logic that might remove metadata size.
                         textlen = mdiff.patchedsize(
                             revlog.size(self, cachedelta[0]), cachedelta[1]
                         )
                     else:
                         textlen = len(rawtext)
                     if deltacomputer is None:
                         # only report delta debugging through the transaction when
                         # ``_debug_delta`` is set
                         write_debug = None
                         if self._debug_delta:
                             write_debug = transaction._report
                         deltacomputer = deltautil.deltacomputer(
                             self, write_debug=write_debug
                         )
                     if cachedelta is not None and len(cachedelta) == 2:
                         # If the cached delta has no information about how it should be
                         # reused, add the default reuse instruction according to the
                         # revlog's configuration.
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse = DELTA_BASE_REUSE_NO
                         cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)
                     revinfo = revlogutils.revisioninfo(
                         node,
                         p1,
                         p2,
                         btext,
                         textlen,
                         cachedelta,
                         flags,
                     )
                     deltainfo = deltacomputer.finddeltainfo(revinfo)
                     # without a docket the compression mode is always "inline"; with
                     # one, it is selected using the docket's default compression header
                     compression_mode = COMP_MODE_INLINE
                     if self._docket is not None:
                         default_comp = self._docket.default_compression_header
                         r = deltautil.delta_compression(default_comp, deltainfo)
                         compression_mode, deltainfo = r
                     sidedata_compression_mode = COMP_MODE_INLINE
                     if sidedata and self.hassidedata:
                         # start from the plain serialization, and only switch to the
                         # compressed form if it turns out to be worth it
                         sidedata_compression_mode = COMP_MODE_PLAIN
                         serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
                         sidedata_offset = self._docket.sidedata_end
                         h, comp_sidedata = self.compress(serialized_sidedata)
                         # keep the compressed form only if it really was compressed
                         # (no 'u' header, no leading NUL byte) and is strictly smaller
                         if (
                             h != b'u'
                             and comp_sidedata[0:1] != b'\0'
                             and len(comp_sidedata) < len(serialized_sidedata)
                         ):
                             assert not h
                             if (
                                 comp_sidedata[0:1]
                                 == self._docket.default_compression_header
                             ):
                                 sidedata_compression_mode = COMP_MODE_DEFAULT
                                 serialized_sidedata = comp_sidedata
                             else:
                                 sidedata_compression_mode = COMP_MODE_INLINE
                                 serialized_sidedata = comp_sidedata
                     else:
                         serialized_sidedata = b""
                         # Don't store the offset if the sidedata is empty, that way
                         # we can easily detect empty sidedata and they will be no different
                         # than ones we manually add.
                         sidedata_offset = 0
                     rank = RANK_UNKNOWN
                     if self._compute_rank:
                         if (p1r, p2r) == (nullrev, nullrev):
                             # root revision
                             rank = 1
                         elif p1r != nullrev and p2r == nullrev:
                             rank = 1 + self.fast_rank(p1r)
                         elif p1r == nullrev and p2r != nullrev:
                             rank = 1 + self.fast_rank(p2r)
                         else:  # merge node
                             if rustdagop is not None and self.index.rust_ext_compat:
                                 rank = rustdagop.rank(self.index, p1r, p2r)
                             else:
                                 # rank of the highest parent, plus one for this
                                 # revision, plus one for each revision returned by
                                 # ``findmissingrevs([pmax], [pmin])``
                                 pmin, pmax = sorted((p1r, p2r))
                                 rank = 1 + self.fast_rank(pmax)
                                 rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))
                     e = revlogutils.entry(
                         flags=flags,
                         data_offset=offset,
                         data_compressed_length=deltainfo.deltalen,
                         data_uncompressed_length=textlen,
                         data_compression_mode=compression_mode,
                         data_delta_base=deltainfo.base,
                         link_rev=link,
                         parent_rev_1=p1r,
                         parent_rev_2=p2r,
                         node_id=node,
                         sidedata_offset=sidedata_offset,
                         sidedata_compressed_length=len(serialized_sidedata),
                         sidedata_compression_mode=sidedata_compression_mode,
                         rank=rank,
                     )
                     # the in-memory index is updated first, the binary form of the new
                     # entry is then read back from it to be written on disk
                     self.index.append(e)
                     entry = self.index.entry_binary(curr)
                     # without a docket, the revlog header is stored in front of the
                     # first index entry
                     if curr == 0 and self._docket is None:
                         header = self._format_flags | self._format_version
                         header = self.index.pack_header(header)
                         entry = header + entry
                     self._writeentry(
                         transaction,
                         entry,
                         deltainfo.data,
                         link,
                         offset,
                         serialized_sidedata,
                         sidedata_offset,
                     )
                     rawtext = btext[0]
                     if alwayscache and rawtext is None:
                         rawtext = deltacomputer.buildtext(revinfo)
                     if type(rawtext) == bytes:  # only accept immutable objects
                         self._revisioncache = (node, curr, rawtext)
                     self._chainbasecache[curr] = deltainfo.chainbase
                     return curr
                 def _get_data_offset(self, prev):
                     """Returns the current offset in the (in-transaction) data file.
                     Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket
                     file to store that information: since sidedata can be rewritten to the
                     end of the data file within a transaction, you can have cases where, for
                     example, rev `n` does not have sidedata while rev `n - 1` does, leading
                     to `n - 1`'s sidedata being written after `n`'s data.
                     TODO cache this in a docket file before getting out of experimental."""
                     if self._docket is None:
                         return self.end(prev)
                     else:
                         return self._docket.data_end
                 def _writeentry(
                     self, transaction, entry, data, link, offset, sidedata, sidedata_offset
                 ):
                     """Write an index entry and its data through the writing handles.

                     transaction - the transaction the written files are registered in
                     entry - the binary index entry to write
                     data - a two-item sequence; for a non-inline revlog the first item
                         is only written when truthy, the second is always written
                     link - not used by this implementation
                     offset - offset of the revision data, as registered in the
                         transaction
                     sidedata - serialized sidedata; must be empty for an inline revlog
                     sidedata_offset - offset registered in the transaction for the
                         sidedata file

                     Raises ProgrammingError when called outside of the `_writing`
                     context.
                     """
                     # Files opened in a+ mode have inconsistent behavior on various
                     # platforms. Windows requires that a file positioning call be made
                     # when the file handle transitions between reads and writes. See
                     # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
                     # platforms, Python or the platform itself can be buggy. Some versions
                     # of Solaris have been observed to not append at the end of the file
                     # if the file was seeked to before the end. See issue4943 for more.
                     #
                     # We work around this issue by inserting a seek() before writing.
                     # Note: This is likely not necessary on Python 3. However, because
                     # the file handle is reused for reads and may be seeked there, we need
                     # to be careful before changing this.
                     if self._writinghandles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     ifh, dfh, sdfh = self._writinghandles
                     # position every open handle where the next write must happen: the
                     # end of the file without a docket, the end recorded in the docket
                     # otherwise
                     if self._docket is None:
                         ifh.seek(0, os.SEEK_END)
                     else:
                         ifh.seek(self._docket.index_end, os.SEEK_SET)
                     if dfh:
                         if self._docket is None:
                             dfh.seek(0, os.SEEK_END)
                         else:
                             dfh.seek(self._docket.data_end, os.SEEK_SET)
                     if sdfh:
                         sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                     # revision number of the entry being written; `_addrevision` appends
                     # it to the in-memory index before calling this method
                     curr = len(self) - 1
                     if not self._inline:
                         transaction.add(self._datafile, offset)
                         if self._sidedatafile:
                             transaction.add(self._sidedatafile, sidedata_offset)
                         transaction.add(self._indexfile, curr * len(entry))
                         if data[0]:
                             dfh.write(data[0])
                         dfh.write(data[1])
                         if sidedata:
                             sdfh.write(sidedata)
                         # the index entry is written after the data it refers to
                         ifh.write(entry)
                     else:
                         # inline: index entries and data are interleaved in the index
                         # file, so the offset must account for the entries as well
                         offset += curr * self.index.entry_size
                         transaction.add(self._indexfile, offset)
                         ifh.write(entry)
                         ifh.write(data[0])
                         ifh.write(data[1])
                         assert not sidedata
                         # the revlog may have just grown past the inline size limit
                         self._enforceinlinesize(transaction)
                     if self._docket is not None:
                         # revlog-v2 always has 3 writing handles, help Pytype
                         wh1 = self._writinghandles[0]
                         wh2 = self._writinghandles[1]
                         wh3 = self._writinghandles[2]
                         assert wh1 is not None
                         assert wh2 is not None
                         assert wh3 is not None
                         # record the new end of each file in the docket
                         self._docket.index_end = wh1.tell()
                         self._docket.data_end = wh2.tell()
                         self._docket.sidedata_end = wh3.tell()
                     nodemaputil.setup_persistent_nodemap(transaction, self)
                 def addgroup(
                     self,
                     deltas,
                     linkmapper,
                     transaction,
                     alwayscache=False,
                     addrevisioncb=None,
                     duplicaterevisioncb=None,
                     debug_info=None,
                     delta_base_reuse_policy=None,
                 ):
                     """Add a group of deltas to this revlog.
                     ``deltas`` is an iterable of 8-item tuples
                     ``(node, p1, p2, linknode, deltabase, delta, flags, sidedata)``.
                     The first delta is against its parent, which should already be in
                     this revlog; the following ones are against the previous delta.
                     ``linkmapper`` is called with each ``linknode`` and its result is
                     stored as the link revision.
                     ``addrevisioncb``, when set, is called as ``cb(revlog, rev)`` for
                     every revision that gets stored. ``duplicaterevisioncb``, when set,
                     is called the same way for every incoming node that is already
                     present.
                     ``delta_base_reuse_policy`` defaults to ``DELTA_BASE_REUSE_TRY`` when
                     the revlog uses general delta with lazy delta base, and to
                     ``DELTA_BASE_REUSE_NO`` otherwise.
                     Returns True if at least one item of ``deltas`` was processed (stored
                     or recognised as a duplicate), False if ``deltas`` was empty.
                     Raises ``error.ProgrammingError`` on nested calls,
                     ``error.LookupError`` for an unknown parent or delta base and
                     ``error.CensoredBaseError`` when a delta against a censored base is
                     not a full replacement.
                     """
                     if self._adding_group:
                         raise error.ProgrammingError(b'cannot nest addgroup() calls')
                     # The caller expressed no preference: derive the policy from the
                     # revlog configuration.
                     if delta_base_reuse_policy is None:
                         reuse_base = (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         )
                         delta_base_reuse_policy = (
                             DELTA_BASE_REUSE_TRY if reuse_base else DELTA_BASE_REUSE_NO
                         )
                     self._adding_group = True
                     processed_any = False
                     try:
                         with self._writing(transaction):
                             write_debug = (
                                 transaction._report if self._debug_delta else None
                             )
                             deltacomputer = deltautil.deltacomputer(
                                 self,
                                 write_debug=write_debug,
                                 debug_info=debug_info,
                             )
                             for (
                                 node,
                                 p1,
                                 p2,
                                 linknode,
                                 deltabase,
                                 delta,
                                 flags,
                                 sidedata,
                             ) in deltas:
                                 link = linkmapper(linknode)
                                 flags = flags or REVIDX_DEFAULT_FLAGS
                                 known_rev = self.index.get_rev(node)
                                 if known_rev is not None:
                                     # Already stored, e.g. two branches made the same
                                     # change: notify and move on.
                                     self._nodeduplicatecallback(transaction, known_rev)
                                     if duplicaterevisioncb:
                                         duplicaterevisioncb(self, known_rev)
                                     processed_any = True
                                     continue
                                 for parent in (p1, p2):
                                     if not self.index.has_node(parent):
                                         raise error.LookupError(
                                             parent, self.radix, _(b'unknown parent')
                                         )
                                 if not self.index.has_node(deltabase):
                                     raise error.LookupError(
                                         deltabase, self.display_id, _(b'unknown delta base')
                                     )
                                 baserev = self.rev(deltabase)
                                 if baserev != nullrev and self.iscensored(baserev):
                                     # A delta on top of a censored base must replace
                                     # the whole base text in one patch operation.
                                     header_size = struct.calcsize(b">lll")
                                     old_size = self.rawsize(baserev)
                                     new_size = len(delta) - header_size
                                     if delta[:header_size] != mdiff.replacediffheader(
                                         old_size, new_size
                                     ):
                                         raise error.CensoredBaseError(
                                             self.display_id, self.node(baserev)
                                         )
                                 if not flags and self._peek_iscensored(baserev, delta):
                                     flags |= REVIDX_ISCENSORED
                                 # Callers using addrevisioncb are expected to read the
                                 # new revision back through revision(), which is fast
                                 # on a cache hit; ``alwayscache`` is forwarded to
                                 # _addrevision() for that purpose. The text argument
                                 # is None: only the (base, delta, policy) triple is
                                 # supplied.
                                 new_rev = self._addrevision(
                                     node,
                                     None,
                                     transaction,
                                     link,
                                     p1,
                                     p2,
                                     flags,
                                     (baserev, delta, delta_base_reuse_policy),
                                     alwayscache=alwayscache,
                                     deltacomputer=deltacomputer,
                                     sidedata=sidedata,
                                 )
                                 if addrevisioncb:
                                     addrevisioncb(self, new_rev)
                                 processed_any = True
                     finally:
                         self._adding_group = False
                     return processed_any
                 def iscensored(self, rev):
                     """Check if a file revision is censored.
                     Returns False when this revlog is not censorable according to
                     ``self.feature_config.censorable``; otherwise returns the flags of
                     ``rev`` masked with ``REVIDX_ISCENSORED`` (non-zero when censored).
                     """
                     if not self.feature_config.censorable:
                         return False
                     return self.flags(rev) & REVIDX_ISCENSORED
                 def _peek_iscensored(self, baserev, delta):
                     """Quickly check if a delta produces a censored revision."""
-                    if not self._censorable:
+                    if not self.feature_config.censorable:
                         return False
                     return storageutil.deltaiscensored(delta, baserev, self.rawsize)
                 def getstrippoint(self, minlink):
                     """Find the minimum rev that must be stripped to strip ``minlink``.
                     Returns a tuple containing that minimum rev and the set of all revs
                     whose linkrevs will be broken by the strip.
                     """
                     tiprev = len(self) - 1
                     heads = self.headrevs()
                     return storageutil.resolvestripinfo(
                         minlink, tiprev, heads, self.linkrev, self.parentrevs
                     )
                 def strip(self, minlink, transaction):
                     """Truncate the revlog at the first revision with linkrev >= minlink.
                     Called when revision ``minlink`` and its descendants are being
                     stripped from the repository. Every revision with a linkrev >=
                     ``minlink`` has to go, because the matching changelog revisions
                     will be renumbered after the strip.
                     The revlog is cut at the first such revision. The caller is trusted
                     to have saved any revision that should survive and to re-add it
                     after the truncation.
                     """
                     if len(self) == 0:
                         return
                     first_rev, _brokenrevs = self.getstrippoint(minlink)
                     if first_rev == len(self):
                         # nothing to remove
                         return
                     # Step 1: register the on-disk truncation points.
                     data_cut = self.start(first_rev)
                     index_cut = first_rev * self.index.entry_size
                     if self._inline:
                         # revision data lives in the index file as well
                         index_cut += data_cut
                     else:
                         transaction.add(self._datafile, data_cut)
                     if self._sidedatafile:
                         sidedata_cut = self.sidedata_cut_off(first_rev)
                         transaction.add(self._sidedatafile, sidedata_cut)
                     transaction.add(self._indexfile, index_cut)
                     docket = self._docket
                     if docket is not None:
                         # XXX the docket could be leveraged while stripping, but it
                         # was not powerful enough when this was written.
                         docket.index_end = index_cut
                         docket.data_end = data_cut
                         docket.sidedata_end = sidedata_cut
                         docket.write(transaction, stripping=True)
                     # Step 2: drop every in-memory trace of the removed revisions.
                     self._revisioncache = None
                     self._chaininfocache = util.lrucachedict(500)
                     self._segmentfile.clear_cache()
                     self._segmentfile_sidedata.clear_cache()
                     del self.index[first_rev:-1]
                 def checksize(self):
                     """Check size of index and data files
                     return a (dd, di) tuple.
                     - dd: extra bytes for the "data" file
                     - di: extra bytes for the "index" file
                     A healthy revlog will return (0, 0).
                     A missing file counts as 0 extra bytes. For an inline revlog ``dd``
                     is always 0 and ``di`` is measured against the index entries plus
                     the length of every revision.
                     """
                     expected = 0
                     if len(self):
                         expected = max(0, self.end(len(self) - 1))
                     try:
                         with self._datafp() as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         dd = actual - expected
                     except FileNotFoundError:
                         dd = 0
                     try:
                         # Use a context manager so the handle is released even when
                         # seek()/tell() raises.
                         with self.opener(self._indexfile) as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         s = self.index.entry_size
                         i = max(0, actual // s)
                         di = actual - (i * s)
                         if self._inline:
                             # index entries and revision data share a single file
                             databytes = sum(max(0, self.length(r)) for r in self)
                             dd = 0
                             di = actual - len(self) * s - databytes
                     except FileNotFoundError:
                         di = 0
                     return (dd, di)
                 def files(self):
                     """Return the list of file paths used by this revlog.
                     The index file always comes first. Without a docket file, the data
                     file follows unless the revlog is inline. With a docket file, the
                     list continues with the docket file, the old index files, the data
                     file (when the docket records a non-zero data end), the old data
                     files, the sidedata file (when the docket records a non-zero
                     sidedata end) and the old sidedata files.
                     """
                     if self._docket_file is None:
                         paths = [self._indexfile]
                         if not self._inline:
                             paths.append(self._datafile)
                         return paths
                     docket = self._docket
                     paths = [self._indexfile, self._docket_file]
                     paths.extend(docket.old_index_filepaths(include_empty=False))
                     if docket.data_end:
                         paths.append(self._datafile)
                     paths.extend(docket.old_data_filepaths(include_empty=False))
                     if docket.sidedata_end:
                         paths.append(self._sidedatafile)
                     paths.extend(docket.old_sidedata_filepaths(include_empty=False))
                     return paths
                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                     sidedata_helpers=None,
                     debug_info=None,
                 ):
                     """Emit revision data for ``nodes`` via ``storageutil.emitrevisions``.
                     ``nodesorder`` must be ``b'nodes'``, ``b'storage'``, ``b'linear'`` or
                     None, otherwise ``error.ProgrammingError`` is raised. When it is None
                     and the revlog does not use general delta, ``b'storage'`` is used.
                     When the revlog does not store delta chains, any ``deltamode`` other
                     than ``CG_DELTAMODE_PREV`` is replaced by ``CG_DELTAMODE_FULL``.
                     The remaining arguments are forwarded unchanged.
                     """
                     accepted_orders = (b'nodes', b'storage', b'linear', None)
                     if nodesorder not in accepted_orders:
                         raise error.ProgrammingError(
                             b'unhandled value for nodesorder: %s' % nodesorder
                         )
                     if nodesorder is None and not self.delta_config.general_delta:
                         nodesorder = b'storage'
                     if not self._storedeltachains:
                         if deltamode != repository.CG_DELTAMODE_PREV:
                             deltamode = repository.CG_DELTAMODE_FULL
                     emit_options = dict(
                         deltaparentfn=self.deltaparent,
                         candeltafn=self._candelta,
                         rawsizefn=self.rawsize,
                         revdifffn=self.revdiff,
                         flagsfn=self.flags,
                         deltamode=deltamode,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         sidedata_helpers=sidedata_helpers,
                         debug_info=debug_info,
                     )
                     return storageutil.emitrevisions(
                         self, nodes, nodesorder, revlogrevisiondelta, **emit_options
                     )
                 # Values accepted for the ``deltareuse`` argument of ``clone()``.
                 DELTAREUSEALWAYS = b'always'
                 DELTAREUSESAMEREVS = b'samerevs'
                 DELTAREUSENEVER = b'never'
                 DELTAREUSEFULLADD = b'fulladd'
                 # Set of every valid value, used for argument validation.
                 DELTAREUSEALL = {
                     DELTAREUSEALWAYS,
                     DELTAREUSESAMEREVS,
                     DELTAREUSENEVER,
                     DELTAREUSEFULLADD,
                 }
                 def clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb=None,
                     deltareuse=DELTAREUSESAMEREVS,
                     forcedeltabothparents=None,
                     sidedata_helpers=None,
                 ):
                     """Copy this revlog into another one, possibly changing its format.
                     The destination ends up with the same revisions and nodes, but it
                     is not guaranteed to be bit-for-bit identical (delta encoding may
                     differ, for instance).
                     ``deltareuse`` selects how deltas stored in this revlog are carried
                     over to the destination:
                     DELTAREUSEALWAYS
                        Always reuse existing deltas (when possible), even if the
                        destination would not have picked the same revisions for the
                        delta. This is the fastest mode.
                     DELTAREUSESAMEREVS
                        Reuse a delta only if the destination would pick the same
                        revisions for it. A balance between speed and optimization.
                     DELTAREUSENEVER
                        Never reuse deltas. This is the slowest mode; it can be used to
                        recompute every delta (e.g. after a diff/delta algorithm change).
                     DELTAREUSEFULLADD
                        Re-add every revision as if it were new content. Slower than
                        DELTAREUSEALWAYS, but it lets more mechanisms kick in (e.g.
                        large file detection and handling).
                     Delta computation can be slow, so this choice can significantly
                     affect run time.
                     The default (``DELTAREUSESAMEREVS``) sits between the two extremes:
                     appropriate deltas are reused, but a better base is used when one
                     exists. When converting a non-generaldelta revlog to generaldelta,
                     this means deltas are recomputed if the delta's parent is not a
                     parent of the revision.
                     ``forcedeltabothparents`` controls whether deltas are computed
                     against both parents for merges; when it is falsy the destination's
                     current setting is kept.
                     See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
                     `sidedata_helpers`.
                     Raises ``ValueError`` for an invalid ``deltareuse``, a non-empty
                     destination, or filtered revisions on either side. The
                     destination's ``delta_config`` is restored before returning.
                     """
                     if deltareuse not in self.DELTAREUSEALL:
                         raise ValueError(
                             _(b'value for deltareuse invalid: %s') % deltareuse
                         )
                     if len(destrevlog):
                         raise ValueError(_(b'destination revlog is not empty'))
                     if getattr(self, 'filteredrevs', None):
                         raise ValueError(_(b'source revlog has filtered revisions'))
                     if getattr(destrevlog, 'filteredrevs', None):
                         raise ValueError(_(b'destination revlog has filtered revisions'))
                     # Work on a copy of the destination's delta configuration so the
                     # original can be put back afterwards.
                     saved_config = destrevlog.delta_config
                     destrevlog.delta_config = destrevlog.delta_config.copy()
                     try:
                         # (lazy_delta_base, lazy_delta) per reuse policy; these two
                         # settings control whether a cached delta is reused.
                         # DELTAREUSEFULLADD leaves both untouched.
                         lazy_settings = {
                             self.DELTAREUSEALWAYS: (True, True),
                             self.DELTAREUSESAMEREVS: (False, True),
                             self.DELTAREUSENEVER: (False, False),
                         }.get(deltareuse)
                         if lazy_settings is not None:
                             lazy_base, lazy = lazy_settings
                             destrevlog.delta_config.lazy_delta_base = lazy_base
                             destrevlog.delta_config.lazy_delta = lazy
                         destrevlog.delta_config.delta_both_parents = (
                             forcedeltabothparents or saved_config.delta_both_parents
                         )
                         with self.reading():
                             self._clone(
                                 tr,
                                 destrevlog,
                                 addrevisioncb,
                                 deltareuse,
                                 forcedeltabothparents,
                                 sidedata_helpers,
                             )
                     finally:
                         destrevlog.delta_config = saved_config
                 def _clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb,
                     deltareuse,
                     forcedeltabothparents,
                     sidedata_helpers,
                 ):
                     """Do the actual copy for `revlog.clone` once arguments are processed.
                     Every revision of this revlog is written to ``destrevlog`` in
                     order. With ``DELTAREUSEFULLADD`` the full text goes through
                     ``destrevlog.addrevision``; otherwise the stored delta is offered to
                     ``destrevlog._addrevision`` when the destination has lazy delta
                     enabled and the revision is stored as a delta, and the raw text is
                     passed when no delta is offered.
                     ``addrevisioncb``, when set, is called as ``cb(self, rev, node)``
                     after each revision. ``forcedeltabothparents`` is not read here.
                     """
                     write_debug = tr._report if self._debug_delta else None
                     deltacomputer = deltautil.deltacomputer(
                         destrevlog,
                         write_debug=write_debug,
                     )
                     src_index = self.index
                     for rev in self:
                         # Read the raw index entry: some classes override linkrev()
                         # to take filtered revisions into account.
                         entry = src_index[rev]
                         flags = entry[0] & 0xFFFF
                         linkrev, node = entry[4], entry[7]
                         p1 = src_index[entry[5]][7]
                         p2 = src_index[entry[6]][7]
                         if deltareuse == self.DELTAREUSEFULLADD:
                             text = self._revisiondata(rev)
                             sidedata = self.sidedata(rev)
                             if sidedata_helpers is not None:
                                 sidedata, new_flags = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # NOTE(review): ``&`` binds tighter than ``|``, so
                                 # new_flags[1] is only masked out of new_flags[0], not
                                 # out of the existing flags - confirm this is intended.
                                 flags |= new_flags[0] & ~new_flags[1]
                             destrevlog.addrevision(
                                 text,
                                 tr,
                                 linkrev,
                                 p1,
                                 p2,
                                 cachedelta=None,
                                 node=node,
                                 flags=flags,
                                 deltacomputer=deltacomputer,
                                 sidedata=sidedata,
                             )
                         else:
                             # (Possibly) hand over the stored delta, if allowed and
                             # the revlog chunk actually is a delta.
                             cachedelta = None
                             rawtext = None
                             if destrevlog._lazydelta:
                                 deltaparent = self.deltaparent(rev)
                                 if deltaparent != nullrev:
                                     cachedelta = (deltaparent, bytes(self._chunk(rev)))
                             sidedata = None
                             if not cachedelta:
                                 rawtext = self._revisiondata(rev)
                                 sidedata = self.sidedata(rev)
                             if sidedata is None:
                                 sidedata = self.sidedata(rev)
                             if sidedata_helpers is not None:
                                 sidedata, new_flags = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # NOTE(review): same precedence remark as in the
                                 # full-add branch above.
                                 flags |= new_flags[0] & ~new_flags[1]
                             with destrevlog._writing(tr):
                                 destrevlog._addrevision(
                                     node,
                                     rawtext,
                                     tr,
                                     linkrev,
                                     p1,
                                     p2,
                                     flags,
                                     cachedelta,
                                     deltacomputer=deltacomputer,
                                     sidedata=sidedata,
                                 )
                         if addrevisioncb:
                             addrevisioncb(self, rev, node)
                 def censorrevision(self, tr, censornode, tombstone=b''):
                     """Censor ``censornode``, dispatching on the revlog format version.
                     Version 0 revlogs cannot be censored and raise
                     ``error.RevlogError``. Version 1 is handled by ``rewrite.v1_censor``
                     and every other version by ``rewrite.v2_censor``.
                     """
                     version = self._format_version
                     if version == REVLOGV0:
                         raise error.RevlogError(
                             _(b'cannot censor with version %d revlogs') % version
                         )
                     if version == REVLOGV1:
                         censor = rewrite.v1_censor
                     else:
                         censor = rewrite.v2_censor
                     censor(self, tr, censornode, tombstone)
                 def verifyintegrity(self, state):
                     """Verifies the integrity of the revlog.
                     Yields ``revlogproblem`` instances describing problems that are
                     found.
                     ``state`` is a dict shared with the caller. This method reads
                     ``state[b'expectedversion']``, ``state[b'erroroncensored']`` and the
                     optional ``state[b'skipflags']`` (defaults to 0). It resets
                     ``state[b'skipread']`` and ``state[b'safe_renamed']`` to empty sets
                     before checking revisions, and adds to ``state[b'skipread']`` the
                     node of every revision reported as censored or that failed to
                     unpack.
                     Because this is a generator, ``state`` is only updated as the
                     caller consumes the yielded problems.
                     """
                     # File-level checks first: trailing bytes in data / index files.
                     dd, di = self.checksize()
                     if dd:
                         yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
                     if di:
                         yield revlogproblem(error=_(b'index contains %d extra bytes') % di)
                     version = self._format_version
                     # The verifier tells us what version revlog we should be.
                     if version != state[b'expectedversion']:
                         yield revlogproblem(
                             warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                             % (self.display_id, version, state[b'expectedversion'])
                         )
                     state[b'skipread'] = set()
                     state[b'safe_renamed'] = set()
                     for rev in self:
                         node = self.node(rev)
                         # Verify contents. 4 cases to care about:
                         #
                         #   common: the most common case
                         #   rename: with a rename
                         #   meta: file content starts with b'\1\n', the metadata
                         #         header defined in filelog.py, but without a rename
                         #   ext: content stored externally
                         #
                         # More formally, their differences are shown below:
                         #
                         #                       | common | rename | meta  | ext
                         #  -------------------------------------------------------
                         #   flags()             | 0      | 0      | 0     | not 0
                         #   renamed()           | False  | True   | False | ?
                         #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
                         #
                         # "rawtext" means the raw text stored in revlog data, which
                         # could be retrieved by "rawdata(rev)". "text"
                         # mentioned below is "revision(rev)".
                         #
                         # There are 3 different lengths stored physically:
                         #  1. L1: rawsize, stored in revlog index
                         #  2. L2: len(rawtext), stored in revlog data
                         #  3. L3: len(text), stored in revlog data if flags==0, or
                         #     possibly somewhere else if flags!=0
                         #
                         # L1 should be equal to L2. L3 could be different from them.
                         # "text" may or may not affect commit hash depending on flag
                         # processors (see flagutil.addflagprocessor).
                         #
                         #              | common  | rename | meta  | ext
                         # -------------------------------------------------
                         #    rawsize() | L1      | L1     | L1    | L1
                         #       size() | L1      | L2-LM  | L1(*) | L1 (?)
                         # len(rawtext) | L2      | L2     | L2    | L2
                         #    len(text) | L2      | L2     | L2    | L3
                         #  len(read()) | L2      | L2-LM  | L2-LM | L3 (?)
                         #
                         # LM:  length of metadata, depending on rawtext
                         # (*): not ideal, see comment in filelog.size
                         # (?): could be "- len(meta)" if the resolved content has
                         #      rename metadata
                         #
                         # Checks needed to be done:
                         #  1. length check: L1 == L2, in all cases.
                         #  2. hash check: depending on flag processor, we may need to
                         #     use either "text" (external), or "rawtext" (in revlog).
                         try:
                             # Keep only the requested skip flags that are actually
                             # set on this revision.
                             skipflags = state.get(b'skipflags', 0)
                             if skipflags:
                                 skipflags &= self.flags(rev)
                             _verify_revision(self, skipflags, state, node)
                             # Length check: size recorded in the index (L1) versus
                             # size of the raw data actually stored (L2).
                             l1 = self.rawsize(rev)
                             l2 = len(self.rawdata(node))
                             if l1 != l2:
                                 yield revlogproblem(
                                     error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                                     node=node,
                                 )
                         except error.CensoredNodeError:
                             # Censored data is only reported (and marked as
                             # unreadable) when the caller asked for it.
                             if state[b'erroroncensored']:
                                 yield revlogproblem(
                                     error=_(b'censored file data'), node=node
                                 )
                                 state[b'skipread'].add(node)
                         except Exception as e:
                             # Any other failure is reported as a problem for this
                             # node instead of aborting the whole verification.
                             yield revlogproblem(
                                 error=_(b'unpacking %s: %s')
                                 % (short(node), stringutil.forcebytestr(e)),
                                 node=node,
                             )
                             state[b'skipread'].add(node)
                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     """Return a dict with the requested pieces of storage information.
                     Each truthy argument adds the bytes key of the same name:
                     - ``exclusivefiles``: list of ``(opener, path)`` pairs for the index
                       file and, unless the revlog is inline, the data file
                     - ``sharedfiles``: always an empty list
                     - ``revisionscount``: number of revisions
                     - ``trackedsize``: sum of ``rawsize()`` over all revisions
                     - ``storedsize``: sum of the on-disk size of every path returned by
                       ``files()``
                     """
                     info = {}
                     if exclusivefiles:
                         exclusive = [(self.opener, self._indexfile)]
                         info[b'exclusivefiles'] = exclusive
                         if not self._inline:
                             exclusive.append((self.opener, self._datafile))
                     if sharedfiles:
                         info[b'sharedfiles'] = []
                     if revisionscount:
                         info[b'revisionscount'] = len(self)
                     if trackedsize:
                         info[b'trackedsize'] = sum(self.rawsize(rev) for rev in self)
                     if storedsize:
                         total = 0
                         for path in self.files():
                             total += self.opener.stat(path).st_size
                         info[b'storedsize'] = total
                     return info
                 def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
                     """Generate sidedata for a range of revisions and store it.

                     For every revision from ``startrev`` to ``endrev`` (both included)
                     the sidedata helpers are run, the result is serialized (and
                     compressed when that makes it smaller), appended to the sidedata
                     file, and the matching index entries are rewritten in place.

                     ``transaction`` is handed to ``self._writing()``.

                     ``helpers`` is passed as-is to
                     ``sidedatautil.run_sidedata_helpers``; when both ``helpers[1]`` and
                     ``helpers[2]`` are empty there is nothing to do.

                     Returns None. The method is a no-op when the revlog has no
                     sidedata support.

                     Raises ``error.Abort`` if one of the revisions already has sidedata
                     recorded in its index entry.
                     """
                     if not self.hassidedata:
                         return
                     # revlog formats with sidedata support do not support inline
                     assert not self._inline
                     if not helpers[1] and not helpers[2]:
                         # Nothing to generate or remove
                         return
                     new_entries = []
                     # append the new sidedata
                     with self._writing(transaction):
                         ifh, dfh, sdfh = self._writinghandles
                         # NOTE(review): this seeks the *data* handle to the sidedata
                         # end while the offset below is read from the *sidedata*
                         # handle; looks like `sdfh.seek` may have been intended.
                         # Left untouched here -- confirm against `_writing()`.
                         dfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                         current_offset = sdfh.tell()
                         for rev in range(startrev, endrev + 1):
                             entry = self.index[rev]
                             new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                                 store=self,
                                 sidedata_helpers=helpers,
                                 sidedata={},
                                 rev=rev,
                             )
                             serialized_sidedata = sidedatautil.serialize_sidedata(
                                 new_sidedata
                             )
                             sidedata_compression_mode = COMP_MODE_INLINE
                             if serialized_sidedata and self.hassidedata:
                                 sidedata_compression_mode = COMP_MODE_PLAIN
                                 h, comp_sidedata = self.compress(serialized_sidedata)
                                 # Indexing bytes yields an int on Python 3, which never
                                 # compares equal to a bytes object; take a one-byte
                                 # slice so the header comparisons are meaningful.
                                 comp_header = comp_sidedata[0:1]
                                 if (
                                     h != b'u'
                                     and comp_header != b'\0'
                                     and len(comp_sidedata) < len(serialized_sidedata)
                                 ):
                                     assert not h
                                     if comp_header == self._docket.default_compression_header:
                                         # compressed with the docket's default engine
                                         sidedata_compression_mode = COMP_MODE_DEFAULT
                                         serialized_sidedata = comp_sidedata
                                     else:
                                         # other engine: the header stays inline with
                                         # the stored chunk
                                         sidedata_compression_mode = COMP_MODE_INLINE
                                         serialized_sidedata = comp_sidedata
                             # entry[8] / entry[9] are presumably the sidedata offset
                             # and length of the index entry -- TODO confirm
                             if entry[8] != 0 or entry[9] != 0:
                                 # rewriting entries that already have sidedata is not
                                 # supported yet, because it introduces garbage data in the
                                 # revlog.
                                 msg = b"rewriting existing sidedata is not supported yet"
                                 raise error.Abort(msg)
                             # Apply (potential) flags to add and to remove after running
                             # the sidedata helpers
                             # NOTE(review): `&` binds tighter than `|`, so this is
                             # `entry[0] | (flags[0] & ~flags[1])`: flags[1] is only
                             # masked out of flags[0], not out of entry[0]. Confirm this
                             # is the intended behavior.
                             new_offset_flags = entry[0] | flags[0] & ~flags[1]
                             entry_update = (
                                 current_offset,
                                 len(serialized_sidedata),
                                 new_offset_flags,
                                 sidedata_compression_mode,
                             )
                             # the sidedata computation might have moved the file cursors
                             # around
                             sdfh.seek(current_offset, os.SEEK_SET)
                             sdfh.write(serialized_sidedata)
                             new_entries.append(entry_update)
                             current_offset += len(serialized_sidedata)
                             self._docket.sidedata_end = sdfh.tell()
                         # rewrite the new index entries
                         ifh.seek(startrev * self.index.entry_size)
                         for i, e in enumerate(new_entries):
                             rev = startrev + i
                             self.index.replace_sidedata_info(rev, *e)
                             packed = self.index.entry_binary(rev)
                             if rev == 0 and self._docket is None:
                                 # without a docket the first entry is written with the
                                 # packed format header prepended
                                 header = self._format_flags | self._format_version
                                 header = self.index.pack_header(header)
                                 packed = header + packed
                             ifh.write(packed)