upstream/mercurial-mirror Commit - r51957:81f38773

1

# revlog.py - storage back-end for mercurial

1

# revlog.py - storage back-end for mercurial

2

# coding: utf8

2

# coding: utf8

3

#

3

#

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

"""Storage back-end for Mercurial.

9

"""Storage back-end for Mercurial.

10

11

This provides efficient delta storage with O(1) retrieve and append

11

This provides efficient delta storage with O(1) retrieve and append

12

and O(changes) merge between branches.

12

and O(changes) merge between branches.

13

"""

13

"""

14

15

16

import binascii

16

import binascii

17

import collections

17

import collections

18

import contextlib

18

import contextlib

19

import io

19

import io

20

import os

20

import os

21

import struct

21

import struct

22

import weakref

22

import weakref

23

import zlib

23

import zlib

24

25

# import stuff from node for others to import from revlog

25

# import stuff from node for others to import from revlog

26

from .node import (

26

from .node import (

27

bin,

27

bin,

28

hex,

28

hex,

29

nullrev,

29

nullrev,

30

sha1nodeconstants,

30

sha1nodeconstants,

31

short,

31

short,

32

wdirrev,

32

wdirrev,

33

)

33

)

34

from .i18n import _

34

from .i18n import _

35

from .revlogutils.constants import (

35

from .revlogutils.constants import (

36

ALL_KINDS,

36

ALL_KINDS,

37

CHANGELOGV2,

37

CHANGELOGV2,

38

COMP_MODE_DEFAULT,

38

COMP_MODE_DEFAULT,

39

COMP_MODE_INLINE,

39

COMP_MODE_INLINE,

40

COMP_MODE_PLAIN,

40

COMP_MODE_PLAIN,

41

DELTA_BASE_REUSE_NO,

41

DELTA_BASE_REUSE_NO,

42

DELTA_BASE_REUSE_TRY,

42

DELTA_BASE_REUSE_TRY,

43

ENTRY_RANK,

43

ENTRY_RANK,

44

FEATURES_BY_VERSION,

44

FEATURES_BY_VERSION,

45

FLAG_GENERALDELTA,

45

FLAG_GENERALDELTA,

46

FLAG_INLINE_DATA,

46

FLAG_INLINE_DATA,

47

INDEX_HEADER,

47

INDEX_HEADER,

48

KIND_CHANGELOG,

48

KIND_CHANGELOG,

49

KIND_FILELOG,

49

KIND_FILELOG,

50

RANK_UNKNOWN,

50

RANK_UNKNOWN,

51

REVLOGV0,

51

REVLOGV0,

52

REVLOGV1,

52

REVLOGV1,

53

REVLOGV1_FLAGS,

53

REVLOGV1_FLAGS,

54

REVLOGV2,

54

REVLOGV2,

55

REVLOGV2_FLAGS,

55

REVLOGV2_FLAGS,

56

REVLOG_DEFAULT_FLAGS,

56

REVLOG_DEFAULT_FLAGS,

57

REVLOG_DEFAULT_FORMAT,

57

REVLOG_DEFAULT_FORMAT,

58

REVLOG_DEFAULT_VERSION,

58

REVLOG_DEFAULT_VERSION,

59

SUPPORTED_FLAGS,

59

SUPPORTED_FLAGS,

60

)

60

)

61

from .revlogutils.flagutil import (

61

from .revlogutils.flagutil import (

62

REVIDX_DEFAULT_FLAGS,

62

REVIDX_DEFAULT_FLAGS,

63

REVIDX_ELLIPSIS,

63

REVIDX_ELLIPSIS,

64

REVIDX_EXTSTORED,

64

REVIDX_EXTSTORED,

65

REVIDX_FLAGS_ORDER,

65

REVIDX_FLAGS_ORDER,

66

REVIDX_HASCOPIESINFO,

66

REVIDX_HASCOPIESINFO,

67

REVIDX_ISCENSORED,

67

REVIDX_ISCENSORED,

68

REVIDX_RAWTEXT_CHANGING_FLAGS,

68

REVIDX_RAWTEXT_CHANGING_FLAGS,

69

)

69

)

70

from .thirdparty import attr

70

from .thirdparty import attr

71

from . import (

71

from . import (

72

ancestor,

72

ancestor,

73

dagop,

73

dagop,

74

error,

74

error,

75

mdiff,

75

mdiff,

76

policy,

76

policy,

77

pycompat,

77

pycompat,

78

revlogutils,

78

revlogutils,

79

templatefilters,

79

templatefilters,

80

util,

80

util,

81

)

81

)

82

from .interfaces import (

82

from .interfaces import (

83

repository,

83

repository,

84

util as interfaceutil,

84

util as interfaceutil,

85

)

85

)

86

from .revlogutils import (

86

from .revlogutils import (

87

deltas as deltautil,

87

deltas as deltautil,

88

docket as docketutil,

88

docket as docketutil,

89

flagutil,

89

flagutil,

90

nodemap as nodemaputil,

90

nodemap as nodemaputil,

91

randomaccessfile,

91

randomaccessfile,

92

revlogv0,

92

revlogv0,

93

rewrite,

93

rewrite,

94

sidedata as sidedatautil,

94

sidedata as sidedatautil,

95

)

95

)

96

from .utils import (

96

from .utils import (

97

storageutil,

97

storageutil,

98

stringutil,

98

stringutil,

99

)

99

)

100

101

# Bare references to all the re-exported names, so that pyflakes does not
# report the corresponding imports as unused.
# We need these names to be available in this module for extensions.

REVLOGV0
REVLOGV1
REVLOGV2
CHANGELOGV2
FLAG_INLINE_DATA
FLAG_GENERALDELTA
REVLOG_DEFAULT_FLAGS
REVLOG_DEFAULT_FORMAT
REVLOG_DEFAULT_VERSION
REVLOGV1_FLAGS
REVLOGV2_FLAGS
REVIDX_ISCENSORED
REVIDX_ELLIPSIS
REVIDX_HASCOPIESINFO
REVIDX_EXTSTORED
REVIDX_DEFAULT_FLAGS
REVIDX_FLAGS_ORDER
REVIDX_RAWTEXT_CHANGING_FLAGS

122

123

# Implementation modules looked up through ``policy``.  The ``rust*`` names
# are compared against ``None`` elsewhere in this module, so they must be
# treated as optional.
parsers = policy.importmod('parsers')
rustancestor = policy.importrust('ancestor')
rustdagop = policy.importrust('dagop')
rustrevlog = policy.importrust('revlog')

127

128

# Aliased for performance.
_zlibdecompress = zlib.decompress

# max size of inline data embedded into a revlog
_maxinline = 131072

133

134

# Flag processors for REVIDX_ELLIPSIS.

134

# Flag processors for REVIDX_ELLIPSIS.

135

def ellipsisreadprocessor(rl, text):
    """Read-side flag processor for REVIDX_ELLIPSIS.

    Returns ``text`` unchanged, paired with ``False``.  ``rl`` is unused.
    """
    return text, False

137

138

139

def ellipsiswriteprocessor(rl, text):
    """Write-side flag processor for REVIDX_ELLIPSIS.

    Returns ``text`` unchanged, paired with ``False``.  ``rl`` is unused.
    """
    return text, False

141

142

143

def ellipsisrawprocessor(rl, text):
    """Raw flag processor for REVIDX_ELLIPSIS.

    Always returns ``False``; both arguments are ignored.
    """
    return False

145

146

147

# (read, write, raw) processors for REVIDX_ELLIPSIS, in that order.
ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)

152

153

154

def _verify_revision(rl, skipflags, state, node):
    """Verify the integrity of the given revlog ``node`` while providing a hook
    point for extensions to influence the operation.

    When ``skipflags`` is truthy, ``node`` is only recorded in
    ``state[b'skipread']`` and nothing is read.  Otherwise the revision is
    read through ``rl.revision(node)``; any exception it raises propagates.
    """
    if skipflags:
        state[b'skipread'].add(node)
    else:
        # Side-effect: read content and verify hash.
        rl.revision(node)

162

163

164

# True if a fast implementation for persistent-nodemap is available
#
# We also consider that we have a "fast" implementation in "pure" Python,
# because people using pure don't really have performance considerations (and
# have a wheelbarrow of other sources of slowness).
HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
    parsers, 'BaseIndexObject'
)

172

173

174

@interfaceutil.implementer(repository.irevisiondelta)
@attr.s(slots=True)
class revlogrevisiondelta:
    """Attribute container declared as implementing
    ``repository.irevisiondelta``.

    Every field is required except ``linknode``, which defaults to ``None``.
    """

    node = attr.ib()
    p1node = attr.ib()
    p2node = attr.ib()
    basenode = attr.ib()
    flags = attr.ib()
    baserevisionsize = attr.ib()
    revision = attr.ib()
    delta = attr.ib()
    sidedata = attr.ib()
    protocol_flags = attr.ib()
    linknode = attr.ib(default=None)

188

189

190

@interfaceutil.implementer(repository.iverifyproblem)
@attr.s(frozen=True)
class revlogproblem:
    """Immutable attribute container declared as implementing
    ``repository.iverifyproblem``.

    All three fields are optional and default to ``None``.
    """

    warning = attr.ib(default=None)
    error = attr.ib(default=None)
    node = attr.ib(default=None)

196

197

198

def parse_index_v1(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` (default format).

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline)
    return index, cache

202

203

204

def parse_index_v2(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` using the
    ``REVLOGV2`` format.

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=REVLOGV2)
    return index, cache

208

209

210

def parse_index_cl_v2(data, inline):
    """Parse index ``data`` with ``parsers.parse_index2`` using the
    ``CHANGELOGV2`` format.

    Returns the ``(index, cache)`` pair produced by the parser.
    """
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=CHANGELOGV2)
    return index, cache

214

215

216

# ``parse_index_v1_nodemap`` only exists when the selected ``parsers`` module
# provides ``parse_index_devel_nodemap``; otherwise the name is bound to None.
if hasattr(parsers, 'parse_index_devel_nodemap'):

    def parse_index_v1_nodemap(data, inline):
        """Parse index ``data`` with ``parsers.parse_index_devel_nodemap``
        and return the resulting ``(index, cache)`` pair."""
        index, cache = parsers.parse_index_devel_nodemap(data, inline)
        return index, cache


else:
    parse_index_v1_nodemap = None

225

226

227

def parse_index_v1_mixed(data, inline):
    """Parse index ``data`` with ``parse_index_v1`` and wrap the resulting
    index in ``rustrevlog.MixedIndex``.

    Returns ``(wrapped_index, cache)``.
    """
    # NOTE(review): `rustrevlog` is compared against None elsewhere in this
    # module; callers presumably only select this parser when it is available.
    index, cache = parse_index_v1(data, inline)
    return rustrevlog.MixedIndex(index), cache

230

231

232

# corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
# signed integer)
_maxentrysize = 0x7FFFFFFF

# Translated message template; takes four values: one %s followed by three %d.
FILE_TOO_SHORT_MSG = _(
    b'cannot read from revlog %s;'
    b' expected %d bytes from offset %d, data size is %d'
)

# Every byte accepted as a hexadecimal digit (both letter cases).
hexdigits = b'0123456789abcdefABCDEF'

242

243

244

class _Config:
    """Base class providing ``copy()`` for configuration holder classes."""

    def copy(self):
        """Return a new instance of the same class, built by passing every
        instance attribute as a keyword argument to the constructor.

        The copy is shallow: attribute values are shared with the original.
        """
        return self.__class__(**self.__dict__)

247

248

249

@attr.s()
class FeatureConfig(_Config):
    """Hold configuration values about the available revlog features"""

    # the default compression engine
    compression_engine = attr.ib(default=b'zlib')
    # compression engines options
    compression_engine_options = attr.ib(default=attr.Factory(dict))

    # can we use censor on this revlog
    censorable = attr.ib(default=False)
    # does this revlog use the "side data" feature
    has_side_data = attr.ib(default=False)
    # might remove rank configuration once the computation has no impact
    compute_rank = attr.ib(default=False)
    # parent order is supposed to be semantically irrelevant, so we
    # normally resort parents to ensure that the first parent is non-null,
    # if there is a non-null parent at all.
    # filelog abuses the parent order as flag to mark some instances of
    # meta-encoded files, so allow it to disable this behavior.
    canonical_parent_order = attr.ib(default=False)
    # can ellipsis commit be used
    enable_ellipsis = attr.ib(default=False)

    def copy(self):
        """Return a copy whose ``compression_engine_options`` is a separate
        (shallow-copied) mapping, so changing it does not affect this one."""
        new = super().copy()
        new.compression_engine_options = self.compression_engine_options.copy()
        return new

277

278

279

@attr.s()
class DataConfig(_Config):
    """Hold configuration value about how the revlog data are read"""

    # should we try to open the "pending" version of the revlog
    try_pending = attr.ib(default=False)
    # should we try to open the "split" version of the revlog
    try_split = attr.ib(default=False)
    # When True, indexfile should be opened with checkambig=True at writing,
    # to avoid file stat ambiguity.
    check_ambig = attr.ib(default=False)

    # If true, use mmap instead of reading to deal with large index
    mmap_large_index = attr.ib(default=False)
    # how much data is large
    mmap_index_threshold = attr.ib(default=None)
    # How much data to read and cache into the raw revlog data cache.
    chunk_cache_size = attr.ib(default=65536)

    # Allow sparse reading of the revlog data
    with_sparse_read = attr.ib(default=False)
    # minimal density of a sparse read chunk
    sr_density_threshold = attr.ib(default=0.50)
    # minimal size of data we skip when performing sparse read
    sr_min_gap_size = attr.ib(default=262144)

    # are deltas encoded against arbitrary bases.
    generaldelta = attr.ib(default=False)

307

308

309

@attr.s()
class DeltaConfig(_Config):
    """Hold configuration value about how new delta are computed

    Some attributes are duplicated from DataConfig to help having each object
    self contained.
    """

    # can delta be encoded against arbitrary bases.
    general_delta = attr.ib(default=False)
    # Allow sparse writing of the revlog data
    sparse_revlog = attr.ib(default=False)
    # maximum length of a delta chain
    max_chain_len = attr.ib(default=None)
    # Maximum distance between delta chain base start and end
    max_deltachain_span = attr.ib(default=-1)
    # If `upper_bound_comp` is not None, this is the expected maximal gain from
    # compression for the data content.
    upper_bound_comp = attr.ib(default=None)
    # Should we try a delta against both parent
    delta_both_parents = attr.ib(default=True)
    # Test delta base candidate group by chunk of this maximal size.
    candidate_group_chunk_size = attr.ib(default=0)
    # Should we display debug information about delta computation
    debug_delta = attr.ib(default=False)
    # trust incoming delta by default
    lazy_delta = attr.ib(default=True)
    # trust the base of incoming delta by default
    lazy_delta_base = attr.ib(default=False)

338

339

340

class revlog:

340

class revlog:

341

"""

341

"""

342

the underlying revision storage object

342

the underlying revision storage object

343

344

A revlog consists of two parts, an index and the revision data.

344

A revlog consists of two parts, an index and the revision data.

345

346

The index is a file with a fixed record size containing

346

The index is a file with a fixed record size containing

347

information on each revision, including its nodeid (hash), the

347

information on each revision, including its nodeid (hash), the

348

nodeids of its parents, the position and offset of its data within

348

nodeids of its parents, the position and offset of its data within

349

the data file, and the revision it's based on. Finally, each entry

349

the data file, and the revision it's based on. Finally, each entry

350

contains a linkrev entry that can serve as a pointer to external

350

contains a linkrev entry that can serve as a pointer to external

351

data.

351

data.

352

353

The revision data itself is a linear collection of data chunks.

353

The revision data itself is a linear collection of data chunks.

354

Each chunk represents a revision and is usually represented as a

354

Each chunk represents a revision and is usually represented as a

355

delta against the previous chunk. To bound lookup time, runs of

355

delta against the previous chunk. To bound lookup time, runs of

356

deltas are limited to about 2 times the length of the original

356

deltas are limited to about 2 times the length of the original

357

version data. This makes retrieval of a version proportional to

357

version data. This makes retrieval of a version proportional to

358

its size, or O(1) relative to the number of revisions.

358

its size, or O(1) relative to the number of revisions.

359

360

Both pieces of the revlog are written to in an append-only

360

Both pieces of the revlog are written to in an append-only

361

fashion, which means we never need to rewrite a file to insert or

361

fashion, which means we never need to rewrite a file to insert or

362

remove data, and can use some simple techniques to avoid the need

362

remove data, and can use some simple techniques to avoid the need

363

for locking while reading.

363

for locking while reading.

364

365

If checkambig, indexfile is opened with checkambig=True at

365

If checkambig, indexfile is opened with checkambig=True at

366

writing, to avoid file stat ambiguity.

366

writing, to avoid file stat ambiguity.

367

368

If mmaplargeindex is True, and an mmapindexthreshold is set, the

368

If mmaplargeindex is True, and an mmapindexthreshold is set, the

369

index will be mmapped rather than read if it is larger than the

369

index will be mmapped rather than read if it is larger than the

370

configured threshold.

370

configured threshold.

371

372

If censorable is True, the revlog can have censored revisions.

372

If censorable is True, the revlog can have censored revisions.

373

374

If `upperboundcomp` is not None, this is the expected maximal gain from

374

If `upperboundcomp` is not None, this is the expected maximal gain from

375

compression for the data content.

375

compression for the data content.

376

377

`concurrencychecker` is an optional function that receives 3 arguments: a

377

`concurrencychecker` is an optional function that receives 3 arguments: a

378

file handle, a filename, and an expected position. It should check whether

378

file handle, a filename, and an expected position. It should check whether

379

the current position in the file handle is valid, and log/warn/fail (by

379

the current position in the file handle is valid, and log/warn/fail (by

380

raising).

380

raising).

381

382

See mercurial/revlogutils/constants.py for details about the content of an
index entry.

384

"""

384

"""

385

386

# Exception class associated with flag handling.
# NOTE(review): its consumers are not visible in this part of the file.
_flagserrorclass = error.RevlogError

387

388

@staticmethod
def is_inline_index(header_bytes):
    """Determine if a revlog is inline from the initial bytes of the index

    ``header_bytes`` is unpacked with ``INDEX_HEADER``.  The low 16 bits of
    the resulting value are the format version and the remaining bits are
    the format flags.  The answer comes from calling the ``b'inline'`` entry
    of ``FEATURES_BY_VERSION[version]`` with the flags.
    """
    header = INDEX_HEADER.unpack(header_bytes)[0]

    # Split the header word: high bits are flags, low 16 bits the version.
    _format_flags = header & ~0xFFFF
    _format_version = header & 0xFFFF

    features = FEATURES_BY_VERSION[_format_version]
    return features[b'inline'](_format_flags)

398

399

def __init__(
    self,
    opener,
    target,
    radix,
    postfix=None,  # only exist for `tmpcensored` now
    checkambig=False,
    mmaplargeindex=False,
    censorable=False,
    upperboundcomp=None,
    persistentnodemap=False,
    concurrencychecker=None,
    trypending=False,
    try_split=False,
    canonical_parent_order=True,
):
    """
    create a revlog object

    opener is a function that abstracts the file opening operation
    and can be used to implement COW semantics or the like.

    `target`: a (KIND, ID) tuple that identifies the content stored in
    this revlog. It helps the rest of the code to understand what the revlog
    is about without having to resort to heuristic and index filename
    analysis. Note that this must reliably be set by normal code, but
    that test, debug, or performance measurement code might not set this to
    an accurate value.

    `checkambig` and `mmaplargeindex` are stored on `self.data_config`;
    `censorable` and `canonical_parent_order` are stored on
    `self.feature_config`. These explicit arguments override whatever the
    config objects copied from `opener.options` contained.

    When `persistentnodemap` is true, the nodemap file is resolved through
    `nodemaputil.get_nodemap_file`.

    The index is loaded (`self._loadindex()`) before the constructor returns.
    """
    self.upperboundcomp = upperboundcomp

    self.radix = radix

    self._docket_file = None
    self._indexfile = None
    self._datafile = None
    self._sidedatafile = None
    self._nodemap_file = None
    self.postfix = postfix
    self._trypending = trypending
    self._try_split = try_split
    self.opener = opener
    if persistentnodemap:
        self._nodemap_file = nodemaputil.get_nodemap_file(self)

    assert target[0] in ALL_KINDS
    assert len(target) == 2
    self.target = target
    # Each config object is a private copy of the one provided through the
    # opener options (when present), so per-instance changes stay local.
    if b'feature-config' in self.opener.options:
        self.feature_config = self.opener.options[b'feature-config'].copy()
    else:
        self.feature_config = FeatureConfig()
    self.feature_config.censorable = censorable
    self.feature_config.canonical_parent_order = canonical_parent_order
    if b'data-config' in self.opener.options:
        self.data_config = self.opener.options[b'data-config'].copy()
    else:
        self.data_config = DataConfig()
    self.data_config.check_ambig = checkambig
    self.data_config.mmap_large_index = mmaplargeindex
    if b'delta-config' in self.opener.options:
        self.delta_config = self.opener.options[b'delta-config'].copy()
    else:
        self.delta_config = DeltaConfig()

    # 3-tuple of (node, rev, text) for a raw revision.
    self._revisioncache = None
    # Maps rev to chain base rev.
    self._chainbasecache = util.lrucachedict(100)
    # 2-tuple of (offset, data) of raw data from the revlog at an offset.
    self._chunkcache = (0, b'')

    self.index = None
    self._docket = None
    self._nodemap_docket = None
    # Mapping of partial identifiers to full nodes.
    self._pcache = {}

    # other optional features

    # Make copy of flag processors so each revlog instance can support
    # custom flags.
    self._flagprocessors = dict(flagutil.flagprocessors)

    # 3-tuple of file handles being used for active writing.
    self._writinghandles = None
    # prevent nesting of addgroup
    self._adding_group = None

    self._loadindex()

    self._concurrencychecker = concurrencychecker

491

492

@property
def _generaldelta(self):
    """temporary compatibility proxy for ``delta_config.general_delta``"""
    return self.delta_config.general_delta

496

497

@property
def _checkambig(self):
    """temporary compatibility proxy for ``data_config.check_ambig``"""
    return self.data_config.check_ambig

501

502

@property
def _mmaplargeindex(self):
    """temporary compatibility proxy for ``data_config.mmap_large_index``"""
    return self.data_config.mmap_large_index

506

507

@property
def _censorable(self):
    """Temporary compatibility proxy for ``feature_config.censorable``."""
    feature_cfg = self.feature_config
    return feature_cfg.censorable

511

512

@property
def _chunkcachesize(self):
    """Temporary compatibility proxy for ``data_config.chunk_cache_size``."""
    data_cfg = self.data_config
    return data_cfg.chunk_cache_size

516

517

@property
def _maxchainlen(self):
    """Temporary compatibility proxy for ``delta_config.max_chain_len``."""
    delta_cfg = self.delta_config
    return delta_cfg.max_chain_len

521

522

@property
def _deltabothparents(self):
    """Temporary compatibility proxy for ``delta_config.delta_both_parents``."""
    delta_cfg = self.delta_config
    return delta_cfg.delta_both_parents

526

527

@property
def _candidate_group_chunk_size(self):
    """Temporary compatibility proxy for
    ``delta_config.candidate_group_chunk_size``."""
    delta_cfg = self.delta_config
    return delta_cfg.candidate_group_chunk_size

531

532

@property
def _debug_delta(self):
    """Temporary compatibility proxy for ``delta_config.debug_delta``."""
    delta_cfg = self.delta_config
    return delta_cfg.debug_delta

536

537

@property
def _compengine(self):
    """Temporary compatibility proxy for
    ``feature_config.compression_engine``."""
    feature_cfg = self.feature_config
    return feature_cfg.compression_engine

541

542

@property
def _compengineopts(self):
    """Temporary compatibility proxy for
    ``feature_config.compression_engine_options``."""
    feature_cfg = self.feature_config
    return feature_cfg.compression_engine_options

546

547

@property
def _maxdeltachainspan(self):
    """Temporary compatibility proxy for
    ``delta_config.max_deltachain_span``."""
    delta_cfg = self.delta_config
    return delta_cfg.max_deltachain_span

551

552

@property
def _withsparseread(self):
    """Temporary compatibility proxy for ``data_config.with_sparse_read``."""
    data_cfg = self.data_config
    return data_cfg.with_sparse_read

556

557

@property
def _sparserevlog(self):
    """Temporary compatibility proxy for ``delta_config.sparse_revlog``."""
    delta_cfg = self.delta_config
    return delta_cfg.sparse_revlog

561

562

@property
def hassidedata(self):
    """Temporary compatibility proxy for ``feature_config.has_side_data``."""
    feature_cfg = self.feature_config
    return feature_cfg.has_side_data

566

567

@property
def _srdensitythreshold(self):
    """Temporary compatibility proxy for
    ``data_config.sr_density_threshold``."""
    data_cfg = self.data_config
    return data_cfg.sr_density_threshold

571

572

@property
def _srmingapsize(self):
    """Temporary compatibility proxy for ``data_config.sr_min_gap_size``."""
    data_cfg = self.data_config
    return data_cfg.sr_min_gap_size

576

577

@property
def _compute_rank(self):
    """Temporary compatibility proxy for ``feature_config.compute_rank``."""
    feature_cfg = self.feature_config
    return feature_cfg.compute_rank

581

582

@property
def canonical_parent_order(self):
    """Temporary compatibility proxy for
    ``feature_config.canonical_parent_order``."""
    feature_cfg = self.feature_config
    return feature_cfg.canonical_parent_order

586

587

@property
def _lazydelta(self):
    """Temporary compatibility proxy for ``delta_config.lazy_delta``."""
    delta_cfg = self.delta_config
    return delta_cfg.lazy_delta

591

592

@property
def _lazydeltabase(self):
    """Temporary compatibility proxy for ``delta_config.lazy_delta_base``."""
    delta_cfg = self.delta_config
    return delta_cfg.lazy_delta_base

596

597

def _init_opts(self):
    """Derive the default revlog mode from the opener options and configs.

    The values computed here are only defaults: they may be overridden by
    what is actually found on disk. Besides returning the tuple below, this
    registers flag processors on ``self._flagprocessors`` and, for
    changelog-v2, stores ``compute_rank`` on ``self.feature_config``.

    Returns a 3-tuple ``(new_header, mmapindexthreshold, force_nodemap)``
    for use in _loadindex():

    * new_header:
        version header to use if we need to create a new revlog

    * mmapindexthreshold:
        minimal index size from which mmap is used (None when
        ``data_config.mmap_large_index`` is off)

    * force_nodemap:
        force the usage of a "development" version of the nodemap code

    Raises error.RevlogError when the configured chunk cache size is not a
    strictly positive power of two.
    """
    options = self.opener.options
    data_cfg = self.data_config
    feature_cfg = self.feature_config

    # header written when a brand new revlog has to be created
    if b'changelogv2' in options and self.revlog_kind == KIND_CHANGELOG:
        header_for_new = CHANGELOGV2
        feature_cfg.compute_rank = options.get(
            b'changelogv2.compute-rank', True
        )
    elif b'revlogv2' in options:
        header_for_new = REVLOGV2
    elif b'revlogv1' in options:
        header_for_new = REVLOGV1 | FLAG_INLINE_DATA
        if b'generaldelta' in options:
            header_for_new |= FLAG_GENERALDELTA
    elif b'revlogv0' in options:
        header_for_new = REVLOGV0
    else:
        header_for_new = REVLOG_DEFAULT_VERSION

    mmap_threshold = (
        data_cfg.mmap_index_threshold if data_cfg.mmap_large_index else None
    )

    if feature_cfg.enable_ellipsis:
        self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

    # revlog v0 doesn't have flag processors
    extra_processors = options.get(b'flagprocessors', {})
    for flag, processor in extra_processors.items():
        flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

    cache_size = data_cfg.chunk_cache_size
    if cache_size <= 0:
        msg = _(b'revlog chunk cache size %r is not greater than 0')
        raise error.RevlogError(msg % cache_size)
    if cache_size & (cache_size - 1):
        # more than one bit set
        msg = _(b'revlog chunk cache size %r is not a power of 2')
        raise error.RevlogError(msg % cache_size)

    use_devel_nodemap = options.get(b'devel-force-nodemap', False)
    return header_for_new, mmap_threshold, use_devel_nodemap

653

654

def _get_data(self, filepath, mmap_threshold, size=None):
    """Return the content of `filepath`, memory-mapped or read normally.

    When `mmap_threshold` is not None and the file is at least that large,
    the content is returned as ``util.buffer(util.mmapread(...))``;
    otherwise it is read with ``fp.read``. `size`, when given, limits how
    much is returned.

    If the file is missing, the empty bytes string is returned.
    """
    try:
        with self.opener(filepath) as fp:
            use_mmap = False
            if mmap_threshold is not None:
                file_size = self.opener.fstat(fp).st_size
                use_mmap = file_size >= mmap_threshold

            if use_mmap:
                # TODO: should .close() to release resources without
                # relying on Python GC
                if size is None:
                    mapped = util.mmapread(fp)
                else:
                    # never map more than the file holds, to avoid a
                    # potential mmap crash
                    mapped = util.mmapread(fp, min(file_size, size))
                return util.buffer(mapped)

            return fp.read() if size is None else fp.read(size)
    except FileNotFoundError:
        return b''

678

679

def get_streams(self, max_linkrev, force_inline=False):
    """Return a list of streams that represent this revlog.

    This is used by stream-clone to do bytes to bytes copies of a repository.

    This streams data for all revisions that refer to a changelog revision up
    to `max_linkrev` (exclusive): trailing revisions whose linkrev is greater
    than or equal to `max_linkrev` are left out.

    If `force_inline` is set, it enforces that the stream will represent an
    inline revlog.

    It returns a list of three-tuples:

        [
            (filename, bytes_stream, stream_size),
            …
        ]

    The list is empty when there is no data to send. Each `bytes_stream` is
    a generator that has already been advanced past its initial
    `yield None` before being returned.
    """
    n = len(self)
    index = self.index
    # Walk backward from the tip, dropping revisions that are too recent.
    while n > 0:
        linkrev = index[n - 1][4]
        if linkrev < max_linkrev:
            break
        # note: this loop will rarely go through multiple iterations, since
        # it only traverses commits created during the current streaming
        # pull operation.
        #
        # If this becomes a problem, using a binary search should cap the
        # runtime of this.
        n = n - 1
    if n == 0:
        # no data to send
        return []
    index_size = n * index.entry_size
    data_size = self.end(n - 1)

    # XXX we might have been split (or stripped) since the object
    # initialization. We need to close this race too, by having a way to
    # pre-open the files we feed to the revlog and never closing them before
    # we are done streaming.

    if self._inline:
        # Inline revlog: index and data are read from the index file.

        def get_stream():
            with self._indexfp() as fp:
                # first step only opens the file (see `next()` below)
                yield None
                size = index_size + data_size
                # small payloads are read in one call, larger ones in chunks
                if size <= 65536:
                    yield fp.read(size)
                else:
                    yield from util.filechunkiter(fp, limit=size)

        inline_stream = get_stream()
        # run the generator up to its first yield so the file is opened now
        next(inline_stream)
        return [
            (self._indexfile, inline_stream, index_size + data_size),
        ]
    elif force_inline:
        # Not inline on disk, but an inline stream was requested: emit each
        # index entry followed by that revision's data segment.

        def get_stream():
            with self.reading():
                yield None

                for rev in range(n):
                    idx = self.index.entry_binary(rev)
                    if rev == 0 and self._docket is None:
                        # re-inject the inline flag
                        header = self._format_flags
                        header |= self._format_version
                        header |= FLAG_INLINE_DATA
                        header = self.index.pack_header(header)
                        idx = header + idx
                    yield idx
                    yield self._getsegmentforrevs(rev, rev)[1]

        inline_stream = get_stream()
        # run the generator up to its first yield (enters `self.reading()`)
        next(inline_stream)
        return [
            (self._indexfile, inline_stream, index_size + data_size),
        ]
    else:
        # Split revlog: one stream for the index file, one for the data file.

        def get_index_stream():
            with self._indexfp() as fp:
                yield None
                if index_size <= 65536:
                    yield fp.read(index_size)
                else:
                    yield from util.filechunkiter(fp, limit=index_size)

        def get_data_stream():
            with self._datafp() as fp:
                yield None
                if data_size <= 65536:
                    yield fp.read(data_size)
                else:
                    yield from util.filechunkiter(fp, limit=data_size)

        # open both files right away by advancing to the first yield
        index_stream = get_index_stream()
        next(index_stream)
        data_stream = get_data_stream()
        next(data_stream)
        return [
            (self._datafile, data_stream, data_size),
            (self._indexfile, index_stream, index_size),
        ]

785

786

def _loadindex(self, docket=None):
    """Read the revlog entry point and (re)build the in-memory index state.

    `docket`, when given, is used as this revlog's docket instead of
    reading the entry point file and decoding its header.

    Sets, among others, the index and data file names, `self.index`, the
    segment-file readers, and fresh `_chaininfocache` / `_decompressors`.
    The format flags and version are only (re)computed here when no
    `docket` is passed.

    Raises `error.RevlogError` on an unknown format version or unknown
    flags, when less index data than the docket announces could be read,
    or when parsing the index raises ValueError/IndexError.
    """

    new_header, mmapindexthreshold, force_nodemap = self._init_opts()

    # Pick the file to start from: explicit postfix first, then a pending
    # index (".i.a"), then a split index file, and finally the plain ".i".
    if self.postfix is not None:
        entry_point = b'%s.i.%s' % (self.radix, self.postfix)
    elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
        entry_point = b'%s.i.a' % self.radix
    elif self._try_split and self.opener.exists(self._split_index_file):
        entry_point = self._split_index_file
    else:
        entry_point = b'%s.i' % self.radix

    if docket is not None:
        self._docket = docket
        self._docket_file = entry_point
    else:
        self._initempty = True
        entry_data = self._get_data(entry_point, mmapindexthreshold)
        if len(entry_data) > 0:
            # existing revlog: the header is the first 4 bytes of the file
            header = INDEX_HEADER.unpack(entry_data[:4])[0]
            self._initempty = False
        else:
            # missing or empty file: use the header computed from options
            header = new_header

        # low 16 bits hold the version, the remaining bits hold the flags
        self._format_flags = header & ~0xFFFF
        self._format_version = header & 0xFFFF

        supported_flags = SUPPORTED_FLAGS.get(self._format_version)
        if supported_flags is None:
            msg = _(b'unknown version (%d) in revlog %s')
            msg %= (self._format_version, self.display_id)
            raise error.RevlogError(msg)
        elif self._format_flags & ~supported_flags:
            msg = _(b'unknown flags (%#04x) in version %d revlog %s')
            display_flag = self._format_flags >> 16
            msg %= (display_flag, self._format_version, self.display_id)
            raise error.RevlogError(msg)

        features = FEATURES_BY_VERSION[self._format_version]
        self._inline = features[b'inline'](self._format_flags)
        self.delta_config.general_delta = features[b'generaldelta'](
            self._format_flags
        )
        self.feature_config.has_side_data = features[b'sidedata']

        if not features[b'docket']:
            # no docket for this version: the entry point is the index
            self._indexfile = entry_point
            index_data = entry_data
        else:
            # the entry point is a docket describing the other files
            self._docket_file = entry_point
            if self._initempty:
                self._docket = docketutil.default_docket(self, header)
            else:
                self._docket = docketutil.parse_docket(
                    self, entry_data, use_pending=self._trypending
                )

    if self._docket is not None:
        # with a docket, the index lives in a file named by the docket and
        # only its first `index_end` bytes are read
        self._indexfile = self._docket.index_filepath()
        index_data = b''
        index_size = self._docket.index_end
        if index_size > 0:
            index_data = self._get_data(
                self._indexfile, mmapindexthreshold, size=index_size
            )
            if len(index_data) < index_size:
                msg = _(b'too few index data for %s: got %d, expected %d')
                msg %= (self.display_id, len(index_data), index_size)
                raise error.RevlogError(msg)

        self._inline = False
        # generaldelta implied by version 2 revlogs.
        self.delta_config.general_delta = True
        # the logic for persistent nodemap will be dealt with within the
        # main docket, so disable it for now.
        self._nodemap_file = None

    if self._docket is not None:
        self._datafile = self._docket.data_filepath()
        self._sidedatafile = self._docket.sidedata_filepath()
    elif self.postfix is None:
        self._datafile = b'%s.d' % self.radix
    else:
        self._datafile = b'%s.d.%s' % (self.radix, self.postfix)

    self.nodeconstants = sha1nodeconstants
    self.nullid = self.nodeconstants.nullid

    # sparse-revlog can't be on without general-delta (issue6056)
    if not self.delta_config.general_delta:
        self.delta_config.sparse_revlog = False

    self._storedeltachains = True

    devel_nodemap = (
        self._nodemap_file
        and force_nodemap
        and parse_index_v1_nodemap is not None
    )

    use_rust_index = False
    if rustrevlog is not None:
        if self._nodemap_file is not None:
            use_rust_index = True
        else:
            use_rust_index = self.opener.options.get(b'rust.index')

    # Select the index parser: v1 by default, overridden by the format
    # version first, then by the nodemap / rust index choices above.
    self._parse_index = parse_index_v1
    if self._format_version == REVLOGV0:
        self._parse_index = revlogv0.parse_index_v0
    elif self._format_version == REVLOGV2:
        self._parse_index = parse_index_v2
    elif self._format_version == CHANGELOGV2:
        self._parse_index = parse_index_cl_v2
    elif devel_nodemap:
        self._parse_index = parse_index_v1_nodemap
    elif use_rust_index:
        self._parse_index = parse_index_v1_mixed
    try:
        d = self._parse_index(index_data, self._inline)
        index, chunkcache = d
        use_nodemap = (
            not self._inline
            and self._nodemap_file is not None
            and hasattr(index, 'update_nodemap_data')
        )
        if use_nodemap:
            nodemap_data = nodemaputil.persisted_data(self)
            if nodemap_data is not None:
                # NOTE: rebinds `docket` (the parameter) to the nodemap
                # docket; the parameter is not used past this point.
                docket = nodemap_data[0]
                # only trust the persisted nodemap if the entry at its
                # recorded tip revision still carries the recorded tip node
                if (
                    len(d[0]) > docket.tip_rev
                    and d[0][docket.tip_rev][7] == docket.tip_node
                ):
                    # no changelog tampering
                    self._nodemap_docket = docket
                    index.update_nodemap_data(*nodemap_data)
    except (ValueError, IndexError):
        raise error.RevlogError(
            _(b"index %s is corrupted") % self.display_id
        )
    self.index = index
    # revision data is read from the index file when inline, from the data
    # file otherwise
    self._segmentfile = randomaccessfile.randomaccessfile(
        self.opener,
        (self._indexfile if self._inline else self._datafile),
        self.data_config.chunk_cache_size,
        chunkcache,
    )
    self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
        self.opener,
        self._sidedatafile,
        self.data_config.chunk_cache_size,
    )
    # revnum -> (chain-length, sum-delta-length)
    self._chaininfocache = util.lrucachedict(500)
    # revlog header -> revlog compressor
    self._decompressors = {}

944

945

def get_revlog(self):
    """Return this revlog itself.

    Simple accessor mirroring the API of other not-really-revlog objects.
    """
    return self

948

949

@util.propertycache
def revlog_kind(self):
    """First element of ``self.target``."""
    target = self.target
    return target[0]

952

953

@util.propertycache
def display_id(self):
    """The public facing "ID" of the revlog that we use in messages.

    For a filelog this is ``self.target[1]``; for any other kind it is
    ``self.radix``.
    """
    if self.revlog_kind != KIND_FILELOG:
        return self.radix
    # Reference the file without the "data/" prefix, so it is familiar
    # to the user.
    return self.target[1]

962

963

def _get_decompressor(self, t):
    """Return the compressor object registered for revlog header `t`.

    Results are memoized in ``self._decompressors``. On a cache miss the
    engine is looked up with ``util.compengines.forrevlogheader(t)`` and its
    ``revlogcompressor`` is built with the configured engine options.

    Raises error.RevlogError if that lookup raises KeyError.
    """
    try:
        return self._decompressors[t]
    except KeyError:
        # not cached yet: resolve the engine from the header
        try:
            engine = util.compengines.forrevlogheader(t)
            found = engine.revlogcompressor(
                self.feature_config.compression_engine_options
            )
        except KeyError:
            raise error.RevlogError(
                _(b'unknown compression type %s') % binascii.hexlify(t)
            )
        self._decompressors[t] = found
        return found

978

979

@util.propertycache
def _compressor(self):
    """Compressor built from the configured compression engine.

    The engine is looked up in ``util.compengines`` under
    ``feature_config.compression_engine``; its ``revlogcompressor`` is
    created with ``feature_config.compression_engine_options``.
    """
    engine_name = self.feature_config.compression_engine
    engine = util.compengines[engine_name]
    make_compressor = engine.revlogcompressor
    return make_compressor(self.feature_config.compression_engine_options)

985

986

@util.propertycache
def _decompressor(self):
    """The default decompressor.

    None when the revlog has no docket; otherwise the ``decompress``
    callable of the compressor matching the docket's
    ``default_compression_header``.
    """
    if self._docket is None:
        return None
    header = self._docket.default_compression_header
    return self._get_decompressor(header).decompress

994

995

def _indexfp(self):
    """Open the revlog's index file for reading and return the file object."""
    index_path = self._indexfile
    return self.opener(index_path, mode=b"r")

998

999

def __index_write_fp(self):
    """Open the index file for writing, positioned where appends go.

    You should not use this directly and use `_writing` instead.

    The file is opened in "r+" mode and positioned at its end, or at the
    docket's ``index_end`` when the revlog has a docket. If the file does
    not exist it is opened in "w+" mode instead.
    """
    try:
        fp = self.opener(
            self._indexfile,
            mode=b"r+",
            checkambig=self.data_config.check_ambig,
        )
        if self._docket is not None:
            fp.seek(self._docket.index_end, os.SEEK_SET)
        else:
            fp.seek(0, os.SEEK_END)
        return fp
    except FileNotFoundError:
        return self.opener(
            self._indexfile,
            mode=b"w+",
            checkambig=self.data_config.check_ambig,
        )

1018

1019

def __index_new_fp(self):
    """Open the index file for a full rewrite (``w`` mode, ``atomictemp``)."""
    # You should not use this unless you are upgrading from inline revlog
    open_file = self.opener
    index_path = self._indexfile
    check_ambig = self.data_config.check_ambig
    return open_file(
        index_path,
        mode=b"w",
        checkambig=check_ambig,
        atomictemp=True,
    )

1027

1028

def _datafp(self, mode=b'r'):
    """Open the revlog's data file with ``mode`` and return the file object."""
    open_file = self.opener
    return open_file(self._datafile, mode=mode)

1031

1032

@contextlib.contextmanager
def _sidedatareadfp(self):
    """Context manager yielding a file object suitable to read sidedata.

    While writing handles are set, their third element is yielded as-is.
    Otherwise the sidedata file is opened for the duration of the ``with``
    block.
    """
    handles = self._writinghandles
    if not handles:
        with self.opener(self._sidedatafile) as fp:
            yield fp
        return
    yield handles[2]

1040

1041

def tiprev(self):
    """Return the highest revision number, i.e. ``len(index) - 1``."""
    revision_count = len(self.index)
    return revision_count - 1

1043

1044

def tip(self):
    """Return the node of the revision reported by ``tiprev()``."""
    last_rev = self.tiprev()
    return self.node(last_rev)

1046

1047

def __contains__(self, rev):
    """Tell whether ``rev`` lies in ``[0, len(self))``."""
    return rev >= 0 and rev < len(self)

1049

1050

def __len__(self):
    """Return the number of entries in the index."""
    index = self.index
    return len(index)

1052

1053

def __iter__(self):
    """Iterate over revision numbers from 0 up to ``len(self) - 1``."""
    revision_count = len(self)
    return iter(range(revision_count))

1055

1056

def revs(self, start=0, stop=None):
    """iterate over all rev in this revlog (from start to stop)

    Delegates to ``storageutil.iterrevs`` with the current revlog length.
    """
    revision_count = len(self)
    return storageutil.iterrevs(revision_count, start=start, stop=stop)

1059

1060

def hasnode(self, node):
    """Return True if ``self.rev(node)`` succeeds, False on ``KeyError``."""
    try:
        self.rev(node)
    except KeyError:
        return False
    else:
        return True

1066

1067

def _candelta(self, baserev, rev):
    """whether two revisions (baserev, rev) can be delta-ed or not"""
    # A delta is refused as soon as one side carries a flag whose processor
    # changes the rawtext (ex. LFS).  Such a processor can alter the rawtext
    # the delta would be computed against, and two clients may hold the same
    # revlog node with different flags (i.e. different rawtext contents), in
    # which case the delta could be incompatible.
    for candidate in (baserev, rev):
        if self.flags(candidate) & REVIDX_RAWTEXT_CHANGING_FLAGS:
            return False
    return True

1079

1080

def update_caches(self, transaction):
    """update on disk cache

    Nothing happens when the revlog has no nodemap file.  Without a
    transaction the persistent nodemap is updated right away; when a
    transaction is passed, the update is registered on it and may be
    delayed to transaction commit.
    """
    if self._nodemap_file is None:
        return
    if transaction is not None:
        nodemaputil.setup_persistent_nodemap(transaction, self)
    else:
        nodemaputil.update_persistent_nodemap(self)

1090

1091

def clearcaches(self):
    """Clear in-memory caches

    Resets the revision cache, chain-base cache, both segment-file caches,
    the ``_pcache`` dict, the nodemap docket and the index's own caches.
    For a non-inline revlog with a nodemap file, whose index exposes
    ``update_nodemap_data``, the persisted nodemap data is then reloaded.
    """
    self._revisioncache = None
    self._chainbasecache.clear()
    self._segmentfile.clear_cache()
    self._segmentfile_sidedata.clear_cache()
    self._pcache = {}
    self._nodemap_docket = None
    self.index.clearcaches()

    # The python code is the one responsible for validating the docket, we
    # end up having to refresh it here.
    if self._inline or self._nodemap_file is None:
        return
    if not hasattr(self.index, 'update_nodemap_data'):
        return
    nodemap_data = nodemaputil.persisted_data(self)
    if nodemap_data is None:
        return
    self._nodemap_docket = nodemap_data[0]
    self.index.update_nodemap_data(*nodemap_data)

1112

1113

def rev(self, node):
    """return the revision number associated with a <nodeid>

    ``TypeError`` from the index lookup is propagated unchanged.  A
    ``RevlogError`` from the lookup is turned into ``WdirUnsupported`` for
    working-directory node ids, and into ``LookupError`` otherwise.
    """
    try:
        return self.index.rev(node)
    except TypeError:
        raise
    except error.RevlogError:
        # parsers.c radix tree lookup failed
        constants = self.nodeconstants
        is_wdir = (
            node == constants.wdirid or node in constants.wdirfilenodeids
        )
        if is_wdir:
            raise error.WdirUnsupported
        raise error.LookupError(node, self.display_id, _(b'no node'))

1127

1128

# Accessors for index entries.

1128

# Accessors for index entries.

1129

1130

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

1130

# First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes

1131

# are flags.

1131

# are flags.

1132

def start(self, rev):
    """Return the offset of ``rev``: first index field with the low 16
    flag bits shifted out."""
    offset_and_flags = self.index[rev][0]
    return int(offset_and_flags >> 16)

1134

1135

def sidedata_cut_off(self, rev):
    """Return the sidedata offset recorded for ``rev``, or a computed one.

    A non-zero offset stored in the entry (field 8) is returned directly.
    Otherwise the result is offset + length (fields 8 and 9) of the closest
    revision at or below ``rev`` that has a non-zero sidedata length, or 0
    if there is none.
    """
    index = self.index
    recorded = index[rev][8]
    if recorded != 0:
        return recorded
    # This is some annoying dance, because entries without sidedata
    # currently use 0 as their offset (instead of previous-offset +
    # previous-size).
    #
    # We should reconsider this "no sidedata -> 0 sidedata offset" policy.
    # In the meantime, we need this.
    for candidate in range(rev, -1, -1):
        entry = index[candidate]
        if entry[9] != 0:
            return entry[8] + entry[9]
    return 0

1151

1152

def flags(self, rev):
    """Return the flags of ``rev``: low 16 bits of the first index field."""
    offset_and_flags = self.index[rev][0]
    return offset_and_flags & 0xFFFF

1154

1155

def length(self, rev):
    """Return the length stored for ``rev`` (index field 1)."""
    entry = self.index[rev]
    return entry[1]

1157

1158

def sidedata_length(self, rev):
    """Return the sidedata length of ``rev`` (index field 9).

    Always 0 when the revlog is configured without sidedata support.
    """
    if self.feature_config.has_side_data:
        return self.index[rev][9]
    return 0

1162

1163

def rawsize(self, rev):
    """return the length of the uncompressed text for a given revision

    The value stored in the index (field 2) is used when it is not
    negative; otherwise the raw data is fetched and measured.
    """
    stored = self.index[rev][2]
    if stored < 0:
        return len(self.rawdata(rev))
    return stored

1171

1172

def size(self, rev):
    """length of non-raw text (processed by a "read" flag processor)"""
    rev_flags = self.flags(rev)
    # Every known flag except ELLIPSIS, which is known to not change the
    # content.
    content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
    if rev_flags & content_changing:
        # slow path: a "read" flag processor may change the content
        return len(self.revision(rev))
    # fast path: size is rawsize
    return self.rawsize(rev)

1181

1182

def fast_rank(self, rev):
    """Return the rank of a revision if already known, or None otherwise.

    The rank of a revision is the size of the sub-graph it defines as a
    head. Equivalently, the rank of a revision `r` is the size of the set
    `ancestors(r)`, `r` included.

    The value is read from the index entry, so the lookup takes constant
    time. Nothing is computed for versions of the revlog which do not
    persist the rank: anything but CHANGELOGV2, or an entry holding
    RANK_UNKNOWN, yields None.
    """
    rank = self.index[rev][ENTRY_RANK]
    if self._format_version != CHANGELOGV2:
        return None
    if rank == RANK_UNKNOWN:
        return None
    # by convention the null revision has rank 0
    return 0 if rev == nullrev else rank

1199

1200

def chainbase(self, rev):
    """Return the revision at the bottom of the chain ``rev`` belongs to.

    Base pointers (index field 3) are followed until an entry names itself
    as its own base.  The answer is memoized in ``_chainbasecache``.
    """
    cached = self._chainbasecache.get(rev)
    if cached is not None:
        return cached

    index = self.index
    current = rev
    while True:
        base = index[current][3]
        if base == current:
            break
        current = base

    self._chainbasecache[rev] = base
    return base

1214

1215

def linkrev(self, rev):
    """Return the linkrev stored for ``rev`` (index field 4)."""
    entry = self.index[rev]
    return entry[4]

1217

1218

def parentrevs(self, rev):
    """Return the two parent revisions of ``rev`` (index fields 5 and 6).

    With ``canonical_parent_order`` enabled and a null first parent, the
    pair is returned swapped.  An out-of-range ``rev`` raises
    ``WdirUnsupported`` when it is the working-directory revision, and
    ``IndexError`` otherwise.
    """
    try:
        entry = self.index[rev]
    except IndexError:
        if rev == wdirrev:
            raise error.WdirUnsupported
        raise

    first, second = entry[5], entry[6]
    if self.canonical_parent_order and first == nullrev:
        return second, first
    return first, second

1230

1231

# fast parentrevs(rev) where rev isn't filtered

1231

# fast parentrevs(rev) where rev isn't filtered

1232

_uncheckedparentrevs = parentrevs

1232

_uncheckedparentrevs = parentrevs

1233

1234

def node(self, rev):
    """Return the node id stored for ``rev`` (index field 7).

    An out-of-range ``rev`` raises ``WdirUnsupported`` when it is the
    working-directory revision, and ``IndexError`` otherwise.
    """
    try:
        entry = self.index[rev]
        return entry[7]
    except IndexError:
        if rev == wdirrev:
            raise error.WdirUnsupported
        raise

1241

1242

# Derived from index values.

1242

# Derived from index values.

1243

1244

def end(self, rev):
    """Return the offset just past ``rev``: ``start(rev) + length(rev)``."""
    begin = self.start(rev)
    return begin + self.length(rev)

1246

1247

def parents(self, node):
    """Return the node ids of the two parents of ``node``.

    With ``canonical_parent_order`` enabled and a null first parent, the
    pair is returned swapped, mirroring ``parentrevs``.

    Index fields 5 and 6 hold parent *revision numbers* (they are used
    below to index the index), so the null check has to compare against
    ``nullrev``.  Comparing against the ``nullid`` node id can never match,
    which silently disabled the canonical ordering here.
    """
    i = self.index
    d = i[self.rev(node)]
    # inline node() to avoid function call overhead
    if self.canonical_parent_order and d[5] == nullrev:
        return i[d[6]][7], i[d[5]][7]
    else:
        return i[d[5]][7], i[d[6]][7]

1255

1256

def chainlen(self, rev):
    """Return the delta chain length: first item of ``_chaininfo(rev)``."""
    chain_length, _compressed_length = self._chaininfo(rev)
    return chain_length

1258

1259

def _chaininfo(self, rev):
    """Return ``(chain length, compressed delta length)`` for ``rev``.

    The chain is walked down to its base: through base pointers (index
    field 3) with general delta, through the previous revision otherwise.
    The walk stops early on a revision whose result is already cached.
    Results are stored in ``_chaininfocache``.
    """
    cache = self._chaininfocache
    if rev in cache:
        return cache[rev]

    index = self.index
    follow_base = self.delta_config.general_delta

    chain_length = 0
    compressed_length = 0
    current = rev
    entry = index[current]
    reused_cache = False
    while current != entry[3]:
        chain_length += 1
        compressed_length += entry[1]
        current = entry[3] if follow_base else current - 1
        if current in cache:
            known_length, known_compressed = cache[current]
            chain_length += known_length
            compressed_length += known_compressed
            reused_cache = True
            break
        entry = index[current]

    if not reused_cache:
        # Add text length of base since decompressing that also takes
        # work. For cache hits the length is already included.
        compressed_length += entry[1]

    result = (chain_length, compressed_length)
    cache[rev] = result
    return result

1289

1290

def _deltachain(self, rev, stoprev=None):
    """Obtain the delta chain for a revision.

    ``stoprev`` specifies a revision to stop at. If not specified, we
    stop at the base of the chain.

    Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
    revs in ascending order and ``stopped`` is a bool indicating whether
    ``stoprev`` was hit.
    """
    generaldelta = self.delta_config.general_delta
    # Try C implementation.
    try:
        return self.index.deltachain(rev, stoprev, generaldelta)
    except AttributeError:
        pass

    # Alias to prevent attribute lookup in tight loop.
    index = self.index

    descending = []
    current = rev
    entry = index[current]
    while current != entry[3] and current != stoprev:
        descending.append(current)
        current = entry[3] if generaldelta else current - 1
        entry = index[current]

    stopped = current == stoprev
    if not stopped:
        # the walk ended on the chain base, which belongs to the chain
        descending.append(current)

    return descending[::-1], stopped

1330

1331

def ancestors(self, revs, stoprev=0, inclusive=False):
    """Generate the ancestors of 'revs' in reverse revision order.
    Does not generate revs lower than stoprev.

    See the documentation for ancestor.lazyancestors for more details."""

    # first, make sure start revisions aren't filtered
    revs = list(revs)
    checkrev = self.node
    for candidate in revs:
        checkrev(candidate)
    # and we're sure ancestors aren't filtered as well

    use_rust = rustancestor is not None and self.index.rust_ext_compat
    if use_rust:
        factory, source = rustancestor.LazyAncestors, self.index
    else:
        factory, source = ancestor.lazyancestors, self._uncheckedparentrevs
    return factory(source, revs, stoprev=stoprev, inclusive=inclusive)

1351

1352

def descendants(self, revs):
    """Return what ``dagop.descendantrevs`` computes for ``revs``, using
    this revlog's ``revs`` and ``parentrevs`` methods."""
    iter_revs = self.revs
    parent_revs = self.parentrevs
    return dagop.descendantrevs(revs, iter_revs, parent_revs)

1354

1355

def findcommonmissing(self, common=None, heads=None):
    """Return a tuple of the ancestors of common and the ancestors of heads
    that are not ancestors of common. In revset terminology, we return the
    tuple:

      ::common, (::heads) - (::common)

    The first item is a set-like object of revision numbers. The second
    item is a list of node IDs sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs. If heads is
    not supplied, uses all of the revlog's heads. If common is not
    supplied, uses nullid."""
    if common is None:
        common = [self.nullid]
    if heads is None:
        heads = self.heads()

    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    # we want the ancestors, but inclusive
    class lazyset:
        """Union of an eager set of added values and a lazy collection."""

        def __init__(self, lazyvalues):
            self.addedvalues = set()
            self.lazyvalues = lazyvalues

        def __contains__(self, value):
            return value in self.addedvalues or value in self.lazyvalues

        def __iter__(self):
            added = self.addedvalues
            yield from added
            # skip lazy values that were already produced from ``added``
            yield from (r for r in self.lazyvalues if r not in added)

        def add(self, value):
            self.addedvalues.add(value)

        def update(self, values):
            self.addedvalues.update(values)

    has = lazyset(self.ancestors(common))
    has.add(nullrev)
    has.update(common)

    # take all ancestors from heads that aren't in has
    missing = set()
    pending = collections.deque([r for r in heads if r not in has])
    while pending:
        current = pending.popleft()
        if current in missing:
            continue
        missing.add(current)
        pending.extend(p for p in self.parentrevs(current) if p not in has)

    return has, [self.node(r) for r in sorted(missing)]

1418

1419

def incrementalmissingrevs(self, common=None):
    """Return an object that can be used to incrementally compute the
    revision numbers of the ancestors of arbitrary sets that are not
    ancestors of common.

    The object is a ``rustancestor.MissingAncestors`` when the Rust
    extension is available and the index is compatible with it, and an
    ``ancestor.incrementalmissingancestors`` otherwise.

    'common' is a list of revision numbers. If common is not supplied, uses
    nullrev.
    """
    if common is None:
        common = [nullrev]

    use_rust = rustancestor is not None and self.index.rust_ext_compat
    if not use_rust:
        return ancestor.incrementalmissingancestors(self.parentrevs, common)
    return rustancestor.MissingAncestors(self.index, common)

1434

1435

def findmissingrevs(self, common=None, heads=None):
    """Return the revision numbers of the ancestors of heads that
    are not ancestors of common.

    More specifically, return a list of revision numbers corresponding to
    nodes N such that every N satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of revision numbers. If heads is
    not supplied, uses all of the revlog's head revisions. If common is
    not supplied, uses nullrev."""
    common_revs = [nullrev] if common is None else common
    head_revs = self.headrevs() if heads is None else heads

    missing_tracker = self.incrementalmissingrevs(common=common_revs)
    return missing_tracker.missingancestors(head_revs)

1458

1459

def findmissing(self, common=None, heads=None):
    """Return the ancestors of heads that are not ancestors of common.

    More specifically, return a list of nodes N such that every N
    satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs. If heads is
    not supplied, uses all of the revlog's heads. If common is not
    supplied, uses nullid."""
    if common is None:
        common = [self.nullid]
    if heads is None:
        heads = self.heads()

    # the incremental helper works on revision numbers, not node IDs
    common_revs = list(map(self.rev, common))
    head_revs = list(map(self.rev, heads))

    missing_tracker = self.incrementalmissingrevs(common=common_revs)
    missing_revs = missing_tracker.missingancestors(head_revs)
    return [self.node(r) for r in missing_revs]

1484

1485

def nodesbetween(self, roots=None, heads=None):
    """Return a topological path from 'roots' to 'heads'.

    The result is a tuple (nodes, outroots, outheads). 'nodes' is a
    topologically sorted list of every node N for which both hold:

      1. N is a descendant of some node in 'roots'
      2. N is an ancestor of some node in 'heads'

    A node counts as its own descendant and its own ancestor, so every
    reachable member of 'roots' and 'heads' appears in 'nodes'.

    'outroots' holds the members of 'roots' that ended up in 'nodes';
    'outheads' is the same for 'heads'.

    'roots' and 'heads' are both lists of node IDs. When 'roots' is
    omitted, nullid is the only root. When 'heads' is omitted, all of
    the revlog's heads are used."""
    if roots is None:
        # Everybody's a descendant of nullid
        roots = [self.nullid]
        lowestrev = nullrev
    else:
        roots = list(roots)
        if not roots:
            return ([], [], [])
        lowestrev = min(self.rev(node) for node in roots)

    if heads is None and lowestrev == nullrev:
        # Nothing constrains the walk: hand back every node.
        return (
            [self.node(rev) for rev in self],
            [self.nullid],
            list(self.heads()),
        )

    if heads is None:
        # Every node is an ancestor of some head, so the scan may run up
        # to the last revision.
        highestrev = len(self) - 1
        # None is the marker for "every node is an ancestor".
        ancestors = None
        # Filled in while scanning below, as heads are discovered.
        heads = {}
    else:
        heads = list(heads)
        if not heads:
            return ([], [], [])
        ancestors = set()
        # Map each requested head to a "reached from the roots" flag.
        # Entries are dropped when a head proves to be a 'fake' head,
        # i.e. an ancestor of another head.
        heads = dict.fromkeys(heads, False)
        # Start at the top and keep marking parents until we're done.
        pending = set(heads)
        # Remember where the top was; it bounds the scan further down.
        highestrev = max(self.rev(node) for node in pending)
        while pending:
            node = pending.pop()
            # Never tag nullid
            if node == self.nullid:
                continue
            # Revision numbers are topologically ordered, so anything
            # below the lowest root cannot descend from a root.
            if self.rev(node) < lowestrev:
                continue
            if node in ancestors:
                # Seen before: if it was passed in as a head it is a
                # fake one, since real heads are not ancestors of other
                # heads.
                if node in heads:
                    heads.pop(node)
                continue
            ancestors.add(node)
            # Queue the non-nullid parents for tagging.
            pending.update(
                [par for par in self.parents(node) if par != self.nullid]
            )
        if not ancestors:
            return ([], [], [])
        # With the ancestor set known, discard roots that are not
        # ancestors of any head.
        if lowestrev > nullrev:
            roots = [root for root in roots if root in ancestors]
            if not roots:
                # No more roots? Return empty list
                return ([], [], [])
            # Recompute the lowest revision from the surviving roots.
            lowestrev = min(self.rev(root) for root in roots)
        else:
            # One of the roots was nullid, so everything is included
            # and the other roots do not matter.
            lowestrev = nullrev
            roots = [self.nullid]

    # Nodes known to descend from a root; seeded with the roots.
    descendants = set(roots)
    # Separate copy of the roots, pruned of roots that descend from
    # other roots (not 'real' roots).
    roots = descendants.copy()
    # Our topologically sorted list of output nodes.
    orderedout = []
    fromnull = lowestrev == nullrev
    # Don't start at nullid: it must not appear in the output, and if it
    # showed up in descendants, empty parents would look like
    # descendants too.
    for rev in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
        node = self.node(rev)
        if fromnull:
            # Everybody is a descendant of nullid
            isdescendant = True
        elif node in descendants:
            # Only roots can already be in the set at this point.
            isdescendant = True
            if node in roots:
                # A root with a descendant parent is not a 'real' root.
                parents = tuple(self.parents(node))
                if parents[0] in descendants or parents[1] in descendants:
                    roots.remove(node)
        else:
            # A node is a descendant if either of its parents is one.
            parents = tuple(self.parents(node))
            isdescendant = (
                parents[0] in descendants or parents[1] in descendants
            )
            if isdescendant:
                descendants.add(node)

        # Only keep nodes that are both descendants and ancestors.
        if not isdescendant:
            continue
        if ancestors is not None and node not in ancestors:
            continue
        orderedout.append(node)
        if ancestors is None:
            # Discovering heads: assume this node is one; a later child
            # will remove it again if it is not.
            heads[node] = True
            # But, obviously its parents aren't.
            for par in self.parents(node):
                heads.pop(par, None)
        elif node in heads:
            # A requested head that is reachable from the roots.
            heads[node] = True

    heads = [head for head, reached in heads.items() if reached]
    roots = list(roots)
    assert orderedout
    assert roots
    assert heads
    return (orderedout, roots, heads)

1644

1645

def headrevs(self, revs=None):
    """Return head revisions, optionally restricted to ``revs``.

    With ``revs`` given, the work goes to ``rustdagop.headrevs`` when
    that module is available and the index sets ``rust_ext_compat``,
    and to ``dagop.headrevs`` otherwise. Without ``revs``, the index's
    own ``headrevs()`` is used, falling back to ``self._headrevs()`` if
    that raises AttributeError.
    """
    if revs is not None:
        use_rust = rustdagop is not None and self.index.rust_ext_compat
        if use_rust:
            return rustdagop.headrevs(self.index, revs)
        return dagop.headrevs(revs, self._uncheckedparentrevs)

    try:
        found = self.index.headrevs()
    except AttributeError:
        # presumably an index type without headrevs(); use the
        # Python implementation instead
        return self._headrevs()
    return found

1654

1655

def computephases(self, roots):
    """Return ``self.index.computephasesmapsets(roots)`` unchanged."""
    phasesets = self.index.computephasesmapsets(roots)
    return phasesets

1657

1658

def _headrevs(self):
    """Compute the head revisions by scanning every index entry.

    Returns ``[nullrev]`` for an empty revlog, otherwise the ascending
    list of revisions that no visited revision names as a parent.
    """
    total = len(self)
    if total == 0:
        return [nullrev]
    # One slot more than there are revisions: a parent value of -1
    # (presumably nullrev) lands on the spare last slot instead of
    # clobbering a real revision. Filtered revisions are never
    # iterated, so nothing starts out as a head.
    flags = [0] * (total + 1)
    entries = self.index
    for rev in self:
        # Candidate head until a later revision claims it as a parent.
        flags[rev] = 1
        entry = entries[rev]
        # Fields 5 and 6 of an entry are used here as the two parents.
        flags[entry[5]] = 0
        flags[entry[6]] = 0
    return [rev for rev, flag in enumerate(flags) if flag]

1670

1671

def heads(self, start=None, stop=None):
    """Return the list of all nodes that have no children.

    If start is given, only heads that are descendants of start are
    returned. If stop is given, all the revs from stop are treated as
    if they had no children.
    """
    if start is None and stop is None:
        # Unrestricted query: answer straight from headrevs().
        if len(self) == 0:
            return [self.nullid]
        return [self.node(rev) for rev in self.headrevs()]

    startrev = nullrev if start is None else self.rev(start)
    stoprevs = {self.rev(node) for node in stop or []}

    headrevs = dagop.headrevssubset(
        self.revs, self.parentrevs, startrev=startrev, stoprevs=stoprevs
    )
    return [self.node(rev) for rev in headrevs]

1696

1697

def children(self, node):
    """Find the children of a given node."""
    found = []
    target = self.rev(node)
    # Only revisions after the target are examined.
    for rev in self.revs(start=target + 1):
        realparents = [pr for pr in self.parentrevs(rev) if pr != nullrev]
        if not realparents:
            # A revision with no real parents counts as a child only
            # when the children of the null revision were asked for.
            if target == nullrev:
                found.append(self.node(rev))
            continue
        # One entry per parent slot that points at the target.
        found.extend(self.node(rev) for pr in realparents if pr == target)
    return found

1710

1711

def commonancestorsheads(self, a, b):
    """Calculate all the heads of the common ancestors of nodes a and b.

    Both arguments are nodes; the result is a list of nodes.
    """
    reva = self.rev(a)
    revb = self.rev(b)
    headrevs = self._commonancestorsheads(reva, revb)
    return pycompat.maplist(self.node, headrevs)

1716

1717

def _commonancestorsheads(self, *revs):
    """Calculate all the heads of the common ancestors of revs.

    The index's own ``commonancestorsheads`` is tried first; if it
    raises AttributeError or OverflowError the computation is redone by
    ``ancestor.commonancestorsheads`` using ``self.parentrevs``.
    """
    try:
        return self.index.commonancestorsheads(*revs)
    except (AttributeError, OverflowError):
        # C implementation failed
        return ancestor.commonancestorsheads(self.parentrevs, *revs)

1724

1725

def isancestor(self, a, b):
    """Return True if node a is an ancestor of node b.

    A revision is considered an ancestor of itself."""
    reva = self.rev(a)
    revb = self.rev(b)
    return self.isancestorrev(reva, revb)

1731

1732

def isancestorrev(self, a, b):
    """Return True if revision a is an ancestor of revision b.

    A revision is considered an ancestor of itself.

    The implementation of this is trivial but the use of
    reachableroots is not."""
    # The null revision and the revision itself always qualify.
    if a == nullrev or a == b:
        return True
    # A higher revision number is never treated as an ancestor.
    if a > b:
        return False
    reached = self.reachableroots(a, [b], [a], includepath=False)
    return bool(reached)

1746

1747

def reachableroots(self, minroot, heads, roots, includepath=False):
    """Return (heads(::(<roots> and <roots>::<heads>)))

    If includepath is True, return (<roots>::<heads>)."""
    try:
        result = self.index.reachableroots2(
            minroot, heads, roots, includepath
        )
    except AttributeError:
        # Note the argument order: the pure helper takes roots before
        # heads.
        return dagop._reachablerootspure(
            self.parentrevs, minroot, roots, heads, includepath
        )
    return result

1759

1760

def ancestor(self, a, b):
    """Calculate the "best" common ancestor of nodes a and b.

    Returns ``self.nullid`` when no common ancestor is reported.
    """
    reva = self.rev(a)
    revb = self.rev(b)
    try:
        candidates = self.index.ancestors(reva, revb)
    except (AttributeError, OverflowError):
        candidates = ancestor.ancestors(self.parentrevs, reva, revb)
    if not candidates:
        return self.nullid
    # choose a consistent winner when there's a tie
    return min(self.node(rev) for rev in candidates)

1772

1773

def _match(self, id):
    """Resolve ``id`` to a node by exact match, or return None.

    Tried in order: an integer revision, a binary node of
    ``nodeconstants.nodelen`` bytes, a decimal revision number given as
    bytes (negative values count from the end), and a full-length hex
    node id.
    """
    if isinstance(id, int):
        # rev
        return self.node(id)

    nodelen = self.nodeconstants.nodelen
    if len(id) == nodelen:
        # possibly a binary node
        # odds of a binary node being all hex in ASCII are 1 in 10**25
        try:
            self.rev(id)  # quick search the index
        except error.LookupError:
            pass  # may be partial hex id
        else:
            return id

    try:
        # str(rev)
        rev = int(id)
        # Only the canonical decimal spelling is accepted.
        if id != b"%d" % rev:
            raise ValueError
        if rev < 0:
            rev += len(self)
        if not (0 <= rev < len(self)):
            raise ValueError
        return self.node(rev)
    except (ValueError, OverflowError):
        pass

    if len(id) == 2 * nodelen:
        # a full hex nodeid?
        try:
            node = bin(id)
            self.rev(node)
        except (binascii.Error, error.LookupError):
            pass
        else:
            return node

    return None

1806

1807

def _partialmatch(self, id):
    """Resolve a hex prefix ``id`` to a node, or return None.

    Raises ``error.AmbiguousPrefixLookupError`` when the prefix is
    ambiguous and ``error.WdirUnsupported`` when the only thing it can
    designate is the working-directory id. A unique slow-path match is
    stored in ``self._pcache``.
    """
    # wdirfilenodeids are not considered here; they should always be
    # given as a full hash
    maybewdir = self.nodeconstants.wdirhex.startswith(id)
    ambiguous = False
    try:
        hit = self.index.partialmatch(id)
        if hit and self.hasnode(hit):
            if not maybewdir:
                return hit
            # single 'ff...' match in radix tree, ambiguous with wdir
            ambiguous = True
        elif maybewdir:
            # no 'ff...' match in radix tree, wdir identified
            raise error.WdirUnsupported
        else:
            return None
    except error.RevlogError:
        # parsers.c radix tree lookup gave multiple matches
        # fast path: for unfiltered changelog, radix tree is accurate
        if not getattr(self, 'filteredrevs', None):
            ambiguous = True
        # fall through to slow path that filters hidden revisions
    except (AttributeError, ValueError):
        # we are pure python, or key is not hex
        pass

    if ambiguous:
        raise error.AmbiguousPrefixLookupError(
            id, self.display_id, _(b'ambiguous identifier')
        )

    if id in self._pcache:
        return self._pcache[id]

    if len(id) <= 40:
        # hex(node)[:...]
        evenlen = len(id) // 2 * 2  # grab an even number of digits
        try:
            # An odd trailing digit is dropped before decoding, so make
            # sure it is hex first; that skips the expensive scan below
            # when it is not.
            if len(id) % 2 and id[-1] not in hexdigits:
                return None
            prefix = bin(id[:evenlen])
        except binascii.Error:
            pass
        else:
            # Field 7 of an index entry is used here as the binary node.
            byprefix = [e[7] for e in self.index if e[7].startswith(prefix)]
            candidates = [
                n
                for n in byprefix
                if hex(n).startswith(id) and self.hasnode(n)
            ]
            if self.nodeconstants.nullhex.startswith(id):
                candidates.append(self.nullid)
            if candidates:
                if len(candidates) == 1 and not maybewdir:
                    self._pcache[id] = candidates[0]
                    return candidates[0]
                raise error.AmbiguousPrefixLookupError(
                    id, self.display_id, _(b'ambiguous identifier')
                )
            if maybewdir:
                raise error.WdirUnsupported
            return None

1870

1871

def lookup(self, id):
    """Locate a node based on:

    - revision number or str(revision number)
    - nodeid or subset of hex nodeid

    Raises ``error.LookupError`` when nothing matches.
    """
    exact = self._match(id)
    if exact is not None:
        return exact

    partial = self._partialmatch(id)
    if partial:
        return partial

    raise error.LookupError(id, self.display_id, _(b'no match found'))

1884

1885

def shortest(self, node, minlength=1):
    """Find the shortest unambiguous prefix that matches node.

    ``minlength`` is the smallest prefix length that will be tried.
    Raises ``error.LookupError`` when the node cannot be found.
    """
    hexnode = hex(node)
    wdirid = self.nodeconstants.wdirid

    def isunique(prefix):
        # True when the prefix resolves without ambiguity.
        try:
            matched = self._partialmatch(prefix)
        except error.AmbiguousPrefixLookupError:
            return False
        except error.WdirUnsupported:
            # single 'ff...' match
            return True
        if matched is None:
            raise error.LookupError(node, self.display_id, _(b'no node'))
        return True

    def allf(prefix):
        # A prefix made only of 'f' digits could also mean wdir.
        return all(c == b'f' for c in pycompat.iterbytestr(prefix))

    def skipwdir(fullhex, startlength):
        """Disambiguate against wdirid."""
        for size in range(startlength, len(fullhex) + 1):
            candidate = fullhex[:size]
            if not allf(candidate):
                return candidate

    if not getattr(self, 'filteredrevs', None):
        try:
            length = max(self.index.shortest(node), minlength)
            return skipwdir(hexnode, length)
        except error.RevlogError:
            if node != wdirid:
                raise error.LookupError(
                    node, self.display_id, _(b'no node')
                )
        except AttributeError:
            # Fall through to pure code
            pass

    lengths = range(minlength, len(hexnode) + 1)

    if node == wdirid:
        for length in lengths:
            prefix = hexnode[:length]
            if isunique(prefix):
                return prefix

    for length in lengths:
        if isunique(hexnode[:length]):
            return skipwdir(hexnode, length)

1935

1936

def cmp(self, node, text):
    """Compare text with a given file revision.

    Returns True if text is different than what is stored.
    """
    parent1, parent2 = self.parents(node)
    # The text matches only if hashing it with the stored parents
    # reproduces the node.
    rehashed = storageutil.hashrevisionsha1(text, parent1, parent2)
    return rehashed != node

1943

1944

def _getsegmentforrevs(self, startrev, endrev):

1944

def _getsegmentforrevs(self, startrev, endrev):

1945

"""Obtain a segment of raw data corresponding to a range of revisions.

1945

"""Obtain a segment of raw data corresponding to a range of revisions.

1946

1947

Accepts the start and end revisions and an optional already-open

1947

Accepts the start and end revisions and an optional already-open

1948

file handle to be used for reading. If the file handle is read, its

1948

file handle to be used for reading. If the file handle is read, its

1949

seek position will not be preserved.

1949

seek position will not be preserved.

1950

1951

Requests for data may be satisfied by a cache.

1951

Requests for data may be satisfied by a cache.

1952

1953

Returns a 2-tuple of (offset, data) for the requested range of

1953

Returns a 2-tuple of (offset, data) for the requested range of

1954

revisions. Offset is the integer offset from the beginning of the

1954

revisions. Offset is the integer offset from the beginning of the

1955

revlog and data is a str or buffer of the raw byte data.

1955

revlog and data is a str or buffer of the raw byte data.

1956

1957

Callers will need to call ``self.start(rev)`` and ``self.length(rev)``

1957

Callers will need to call ``self.start(rev)`` and ``self.length(rev)``

1958

to determine where each revision's data begins and ends.

1958

to determine where each revision's data begins and ends.

1959

"""

1959

"""

1960

# Inlined self.start(startrev) & self.end(endrev) for perf reasons

1960

# Inlined self.start(startrev) & self.end(endrev) for perf reasons

1961

# (functions are expensive).

1961

# (functions are expensive).

1962

index = self.index

1962

index = self.index

1963

istart = index[startrev]

1963

istart = index[startrev]

1964

start = int(istart[0] >> 16)

1964

start = int(istart[0] >> 16)

1965

if startrev == endrev:

1965

if startrev == endrev:

1966

end = start + istart[1]

1966

end = start + istart[1]

1967

else:

1967

else:

1968

iend = index[endrev]

1968

iend = index[endrev]

1969

end = int(iend[0] >> 16) + iend[1]

1969

end = int(iend[0] >> 16) + iend[1]

1970

1971

if self._inline:

1971

if self._inline:

1972

start += (startrev + 1) * self.index.entry_size

1972

start += (startrev + 1) * self.index.entry_size

1973

end += (endrev + 1) * self.index.entry_size

1973

end += (endrev + 1) * self.index.entry_size

1974

length = end - start

1974

length = end - start

1975

1976

return start, self._segmentfile.read_chunk(start, length)

1976

return start, self._segmentfile.read_chunk(start, length)

1977

1978

def _chunk(self, rev):
    """Return the decompressed chunk stored for revision ``rev``.

    The compression mode recorded in the index entry selects how the raw
    segment is turned into the returned data: plain data is returned
    untouched, the default mode goes through ``self._decompressor`` and
    the inline mode goes through ``self.decompress``.

    Raises ``error.RevlogError`` when the recorded mode is unknown.
    """
    mode = self.index[rev][10]
    raw = self._getsegmentforrevs(rev, rev)[1]
    if mode == COMP_MODE_PLAIN:
        return raw
    if mode == COMP_MODE_DEFAULT:
        return self._decompressor(raw)
    if mode == COMP_MODE_INLINE:
        return self.decompress(raw)
    raise error.RevlogError(b'unknown compression mode %d' % mode)

1999

2000

def _chunks(self, revs, targetsize=None):
    """Obtain decompressed chunks for the specified revisions.

    ``revs`` holds numeric revisions that are assumed to be in ascending
    order. ``targetsize`` is forwarded to ``deltautil.slicechunk`` when
    sparse reading is enabled and is not used otherwise.

    This function is similar to calling ``self._chunk()`` multiple times,
    but is faster.

    Returns a list with decompressed data for each requested revision.
    Raises ``error.RevlogError`` if a revision records an unknown
    compression mode.
    """
    if not revs:
        return []
    start = self.start
    length = self.length
    inline = self._inline
    iosize = self.index.entry_size
    buffer = util.buffer

    chunks = []
    add_chunk = chunks.append

    if not self.data_config.with_sparse_read:
        slicedchunks = (revs,)
    else:
        slicedchunks = deltautil.slicechunk(
            self, revs, targetsize=targetsize
        )

    for revschunk in slicedchunks:
        firstrev = revschunk[0]
        # Skip trailing revisions with empty diff
        for lastrev in revschunk[::-1]:
            if length(lastrev) != 0:
                break

        try:
            offset, data = self._getsegmentforrevs(firstrev, lastrev)
        except OverflowError:
            # issue4215 - we can't cache a run of chunks greater than
            # 2G on Windows. Fall back to reading this slice one
            # revision at a time, keeping the chunks gathered from
            # earlier slices and still processing the following ones.
            for rev in revschunk:
                add_chunk(self._chunk(rev))
            continue

        decomp = self.decompress
        # self._decompressor might be None, but will not be used in that case
        def_decomp = self._decompressor
        for rev in revschunk:
            chunkstart = start(rev)
            if inline:
                chunkstart += (rev + 1) * iosize
            chunklength = length(rev)
            comp_mode = self.index[rev][10]
            # view on this revision's bytes inside the segment just read
            c = buffer(data, chunkstart - offset, chunklength)
            if comp_mode == COMP_MODE_PLAIN:
                add_chunk(c)
            elif comp_mode == COMP_MODE_INLINE:
                add_chunk(decomp(c))
            elif comp_mode == COMP_MODE_DEFAULT:
                add_chunk(def_decomp(c))
            else:
                msg = b'unknown compression mode %d'
                msg %= comp_mode
                raise error.RevlogError(msg)

    return chunks

2067

2068

def deltaparent(self, rev):
    """Return the revision that ``rev`` is stored as a delta against.

    ``nullrev`` is returned when the index entry names ``rev`` itself as
    its base. Otherwise the recorded base is returned when general delta
    is enabled, and ``rev - 1`` when it is not.
    """
    delta_base = self.index[rev][3]
    if delta_base == rev:
        return nullrev
    if self.delta_config.general_delta:
        return delta_base
    return rev - 1

2077

2078

def issnapshot(self, rev):
    """Tell whether ``rev`` is a snapshot.

    Without sparse-revlog, a revision is a snapshot exactly when its delta
    parent is ``nullrev``. With sparse-revlog, the index implementation
    is used when the index provides one; otherwise the delta base is
    compared with both parents (skipping over empty revisions) and the
    check recurses on the base.
    """
    if not self.delta_config.sparse_revlog:
        return self.deltaparent(rev) == nullrev
    if hasattr(self.index, 'issnapshot'):
        # shadow this method on the instance with the index one, so the
        # test and the extra attribute access only happen once
        self.issnapshot = self.index.issnapshot
        return self.issnapshot(rev)
    if rev == nullrev:
        return True
    entry = self.index[rev]
    base = entry[3]
    if base == rev or base == nullrev:
        return True

    def skip_empty(parent):
        # walk delta parents for as long as the revision has no data
        while self.length(parent) == 0:
            previous = self.deltaparent(parent)
            if previous == parent:
                break
            parent = previous
        return parent

    p1 = skip_empty(entry[5])
    p2 = skip_empty(entry[6])
    if base != p1 and base != p2:
        return self.issnapshot(base)
    # a delta against one of the parents is not a snapshot
    return False

2109

2110

def snapshotdepth(self, rev):
    """Return the number of snapshots in the chain before ``rev``.

    The value is the length of the delta chain of ``rev`` minus one.

    Raises ``error.ProgrammingError`` when ``rev`` is not a snapshot.
    """
    if not self.issnapshot(rev):
        # interpolate the revision number so the message names the
        # offending revision instead of showing a literal "%d"
        raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
    return len(self._deltachain(rev)[0]) - 1

2115

2116

def revdiff(self, rev1, rev2):
    """Return a binary delta turning ``rev1`` into ``rev2``.

    When ``rev2`` is already stored as a delta against ``rev1`` (and
    ``rev1`` is not ``nullrev``), the stored chunk is returned as bytes.
    Otherwise the delta is computed from the raw data of both revisions.

    The delta is in binary form and is intended to be written to revlog
    data directly, which is why raw revision data is used.
    """
    stored_delta_matches = (
        rev1 != nullrev and self.deltaparent(rev2) == rev1
    )
    if stored_delta_matches:
        return bytes(self._chunk(rev2))

    old_raw = self.rawdata(rev1)
    new_raw = self.rawdata(rev2)
    return mdiff.textdiff(old_raw, new_raw)

2126

2127

def revision(self, nodeorrev):
    """Return the uncompressed revision for a node or revision number.

    This delegates to ``self._revisiondata`` with its default (non-raw)
    behavior.
    """
    text = self._revisiondata(nodeorrev)
    return text

2132

2133

def sidedata(self, nodeorrev):
    """Return the sidedata of a changeset: extra data related to it that
    is not part of the hash.

    ``nodeorrev`` may be a revision number or a node; a node is first
    resolved with ``self.rev``.

    This function currently returns a dictionary. However, a more advanced
    mapping object will likely be used in the future for more
    efficient/lazy code.
    """
    # an int is already a revision number, anything else is a node
    rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
    return self._sidedata(rev)

2146

2147

def _revisiondata(self, nodeorrev, raw=False):

2147

def _revisiondata(self, nodeorrev, raw=False):

2148

# deal with <nodeorrev> argument type

2148

# deal with <nodeorrev> argument type

2149

if isinstance(nodeorrev, int):

2149

if isinstance(nodeorrev, int):

2150

rev = nodeorrev

2150

rev = nodeorrev

2151

node = self.node(rev)

2151

node = self.node(rev)

2152

else:

2152

else:

2153

node = nodeorrev

2153

node = nodeorrev

2154

rev = None

2154

rev = None

2155

2156

# fast path the special `nullid` rev

2156

# fast path the special `nullid` rev

2157

if node == self.nullid:

2157

if node == self.nullid:

2158

return b""

2158

return b""

2159

2160

# ``rawtext`` is the text as stored inside the revlog. Might be the

2160

# ``rawtext`` is the text as stored inside the revlog. Might be the

2161

# revision or might need to be processed to retrieve the revision.

2161

# revision or might need to be processed to retrieve the revision.

2162

rev, rawtext, validated = self._rawtext(node, rev)

2162

rev, rawtext, validated = self._rawtext(node, rev)

2163

2164

if raw and validated:

2164

if raw and validated:

2165

# if we don't want to process the raw text and that raw

2165

# if we don't want to process the raw text and that raw

2166

# text is cached, we can exit early.

2166

# text is cached, we can exit early.

2167

return rawtext

2167

return rawtext

2168

if rev is None:

2168

if rev is None:

2169

rev = self.rev(node)

2169

rev = self.rev(node)

2170

# the revlog's flag for this revision

2170

# the revlog's flag for this revision

2171

# (usually alter its state or content)

2171

# (usually alter its state or content)

2172

flags = self.flags(rev)

2172

flags = self.flags(rev)

2173

2174

if validated and flags == REVIDX_DEFAULT_FLAGS:

2174

if validated and flags == REVIDX_DEFAULT_FLAGS:

2175

# no extra flags set, no flag processor runs, text = rawtext

2175

# no extra flags set, no flag processor runs, text = rawtext

2176

return rawtext

2176

return rawtext

2177

2178

if raw:

2178

if raw:

2179

validatehash = flagutil.processflagsraw(self, rawtext, flags)

2179

validatehash = flagutil.processflagsraw(self, rawtext, flags)

2180

text = rawtext

2180

text = rawtext

2181

else:

2181

else:

2182

r = flagutil.processflagsread(self, rawtext, flags)

2182

r = flagutil.processflagsread(self, rawtext, flags)

2183

text, validatehash = r

2183

text, validatehash = r

2184

if validatehash:

2184

if validatehash:

2185

self.checkhash(text, node, rev=rev)

2185

self.checkhash(text, node, rev=rev)

2186

if not validated:

2186

if not validated:

2187

self._revisioncache = (node, rev, rawtext)

2187

self._revisioncache = (node, rev, rawtext)

2188

2189

return text

2189

return text

2190

2191

def _rawtext(self, node, rev):

2191

def _rawtext(self, node, rev):

2192

"""return the possibly unvalidated rawtext for a revision

2192

"""return the possibly unvalidated rawtext for a revision

2193

2194

returns (rev, rawtext, validated)

2194

returns (rev, rawtext, validated)

2195

"""

2195

"""

2196

2197

# revision in the cache (could be useful to apply delta)

2197

# revision in the cache (could be useful to apply delta)

2198

cachedrev = None

2198

cachedrev = None

2199

# An intermediate text to apply deltas to

2199

# An intermediate text to apply deltas to

2200

basetext = None

2200

basetext = None

2201

2202

# Check if we have the entry in cache

2202

# Check if we have the entry in cache

2203

# The cache entry looks like (node, rev, rawtext)

2203

# The cache entry looks like (node, rev, rawtext)

2204

if self._revisioncache:

2204

if self._revisioncache:

2205

if self._revisioncache[0] == node:

2205

if self._revisioncache[0] == node:

2206

return (rev, self._revisioncache[2], True)

2206

return (rev, self._revisioncache[2], True)

2207

cachedrev = self._revisioncache[1]

2207

cachedrev = self._revisioncache[1]

2208

2209

if rev is None:

2209

if rev is None:

2210

rev = self.rev(node)

2210

rev = self.rev(node)

2211

2212

chain, stopped = self._deltachain(rev, stoprev=cachedrev)

2212

chain, stopped = self._deltachain(rev, stoprev=cachedrev)

2213

if stopped:

2213

if stopped:

2214

basetext = self._revisioncache[2]

2214

basetext = self._revisioncache[2]

2215

2216

# drop cache to save memory, the caller is expected to

2216

# drop cache to save memory, the caller is expected to

2217

# update self._revisioncache after validating the text

2217

# update self._revisioncache after validating the text

2218

self._revisioncache = None

2218

self._revisioncache = None

2219

2220

targetsize = None

2220

targetsize = None

2221

rawsize = self.index[rev][2]

2221

rawsize = self.index[rev][2]

2222

if 0 <= rawsize:

2222

if 0 <= rawsize:

2223

targetsize = 4 * rawsize

2223

targetsize = 4 * rawsize

2224

2225

bins = self._chunks(chain, targetsize=targetsize)

2225

bins = self._chunks(chain, targetsize=targetsize)

2226

if basetext is None:

2226

if basetext is None:

2227

basetext = bytes(bins[0])

2227

basetext = bytes(bins[0])

2228

bins = bins[1:]

2228

bins = bins[1:]

2229

2230

rawtext = mdiff.patches(basetext, bins)

2230

rawtext = mdiff.patches(basetext, bins)

2231

del basetext # let us have a chance to free memory early

2231

del basetext # let us have a chance to free memory early

2232

return (rev, rawtext, False)

2232

return (rev, rawtext, False)

2233

2234

def _sidedata(self, rev):

2234

def _sidedata(self, rev):

2235

"""Return the sidedata for a given revision number."""

2235

"""Return the sidedata for a given revision number."""

2236

index_entry = self.index[rev]

2236

index_entry = self.index[rev]

2237

sidedata_offset = index_entry[8]

2237

sidedata_offset = index_entry[8]

2238

sidedata_size = index_entry[9]

2238

sidedata_size = index_entry[9]

2239

2240

if self._inline:

2240

if self._inline:

2241

sidedata_offset += self.index.entry_size * (1 + rev)

2241

sidedata_offset += self.index.entry_size * (1 + rev)

2242

if sidedata_size == 0:

2242

if sidedata_size == 0:

2243

return {}

2243

return {}

2244

2245

if self._docket.sidedata_end < sidedata_offset + sidedata_size:

2245

if self._docket.sidedata_end < sidedata_offset + sidedata_size:

2246

filename = self._sidedatafile

2246

filename = self._sidedatafile

2247

end = self._docket.sidedata_end

2247

end = self._docket.sidedata_end

2248

offset = sidedata_offset

2248

offset = sidedata_offset

2249

length = sidedata_size

2249

length = sidedata_size

2250

m = FILE_TOO_SHORT_MSG % (filename, length, offset, end)

2250

m = FILE_TOO_SHORT_MSG % (filename, length, offset, end)

2251

raise error.RevlogError(m)

2251

raise error.RevlogError(m)

2252

2253

comp_segment = self._segmentfile_sidedata.read_chunk(

2253

comp_segment = self._segmentfile_sidedata.read_chunk(

2254

sidedata_offset, sidedata_size

2254

sidedata_offset, sidedata_size

2255

)

2255

)

2256

2257

comp = self.index[rev][11]

2257

comp = self.index[rev][11]

2258

if comp == COMP_MODE_PLAIN:

2258

if comp == COMP_MODE_PLAIN:

2259

segment = comp_segment

2259

segment = comp_segment

2260

elif comp == COMP_MODE_DEFAULT:

2260

elif comp == COMP_MODE_DEFAULT:

2261

segment = self._decompressor(comp_segment)

2261

segment = self._decompressor(comp_segment)

2262

elif comp == COMP_MODE_INLINE:

2262

elif comp == COMP_MODE_INLINE:

2263

segment = self.decompress(comp_segment)

2263

segment = self.decompress(comp_segment)

2264

else:

2264

else:

2265

msg = b'unknown compression mode %d'

2265

msg = b'unknown compression mode %d'

2266

msg %= comp

2266

msg %= comp

2267

raise error.RevlogError(msg)

2267

raise error.RevlogError(msg)

2268

2269

sidedata = sidedatautil.deserialize_sidedata(segment)

2269

sidedata = sidedatautil.deserialize_sidedata(segment)

2270

return sidedata

2270

return sidedata

2271

2272

def rawdata(self, nodeorrev):
    """Return the uncompressed raw data for a node or revision number.

    This delegates to ``self._revisiondata`` with ``raw=True``.
    """
    rawtext = self._revisiondata(nodeorrev, raw=True)
    return rawtext

2275

2276

def hash(self, text, p1, p2):
    """Compute the node hash of ``text`` with parents ``p1`` and ``p2``.

    Kept as a method so that subclasses can replace the hash as needed.
    """
    node = storageutil.hashrevisionsha1(text, p1, p2)
    return node

2283

2284

def checkhash(self, text, node, p1=None, p2=None, rev=None):
    """Check node hash integrity.

    ``text`` is hashed with ``self.hash`` and compared to ``node``. When
    neither ``p1`` nor ``p2`` is given, the parents are looked up from
    ``node``. ``rev``, when given, is only used in the error message.

    Raises ``error.RevlogError`` on mismatch, or
    ``error.CensoredNodeError`` instead when the revlog is censorable and
    ``text`` is a censored text.

    Available as a function so that subclasses can extend hash mismatch
    behaviors as needed.
    """
    try:
        if p1 is None and p2 is None:
            p1, p2 = self.parents(node)
        mismatch = node != self.hash(text, p1, p2)
        if mismatch:
            # Clear the revision cache on hash failure. The revision cache
            # only stores the raw revision, so dropping it merely costs a
            # cache miss the next time the raw revision data is accessed.
            # This case should be rare, and teaching the cache about the
            # hash verification state would be extra work.
            cache = self._revisioncache
            if cache and cache[0] == node:
                self._revisioncache = None

            if rev is None:
                label = templatefilters.short(hex(node))
            else:
                label = rev
            msg = _(b"integrity check failed on %s:%s")
            raise error.RevlogError(
                msg % (self.display_id, pycompat.bytestr(label))
            )
    except error.RevlogError:
        censored = (
            self.feature_config.censorable
            and storageutil.iscensoredtext(text)
        )
        if censored:
            raise error.CensoredNodeError(self.display_id, node, text)
        raise

2316

2317

@property

2317

@property

2318

def _split_index_file(self):

2318

def _split_index_file(self):

2319

"""the path where to expect the index of an ongoing splitting operation

2319

"""the path where to expect the index of an ongoing splitting operation

2320

2321

The file will only exist if a splitting operation is in progress, but

2321

The file will only exist if a splitting operation is in progress, but

2322

it is always expected at the same location."""

2322

it is always expected at the same location."""

2323

parts = self.radix.split(b'/')

2323

parts = self.radix.split(b'/')

2324

if len(parts) > 1:

2324

if len(parts) > 1:

2325

# adds a '-s' prefix to the ``data/` or `meta/` base

2325

# adds a '-s' prefix to the ``data/` or `meta/` base

2326

head = parts[0] + b'-s'

2326

head = parts[0] + b'-s'

2327

mids = parts[1:-1]

2327

mids = parts[1:-1]

2328

tail = parts[-1] + b'.i'

2328

tail = parts[-1] + b'.i'

2329

pieces = [head] + mids + [tail]

2329

pieces = [head] + mids + [tail]

2330

return b'/'.join(pieces)

2330

return b'/'.join(pieces)

2331

else:

2331

else:

2332

# the revlog is stored at the root of the store (changelog or

2332

# the revlog is stored at the root of the store (changelog or

2333

# manifest), no risk of collision.

2333

# manifest), no risk of collision.

2334

return self.radix + b'.i.s'

2334

return self.radix + b'.i.s'

2335

2336

def _enforceinlinesize(self, tr, side_write=True):

2336

def _enforceinlinesize(self, tr, side_write=True):

2337

"""Check if the revlog is too big for inline and convert if so.

2337

"""Check if the revlog is too big for inline and convert if so.

2338

2339

This should be called after revisions are added to the revlog. If the

2339

This should be called after revisions are added to the revlog. If the

2340

revlog has grown too large to be an inline revlog, it will convert it

2340

revlog has grown too large to be an inline revlog, it will convert it

2341

to use multiple index and data files.

2341

to use multiple index and data files.

2342

"""

2342

"""

2343

tiprev = len(self) - 1

2343

tiprev = len(self) - 1

2344

total_size = self.start(tiprev) + self.length(tiprev)

2344

total_size = self.start(tiprev) + self.length(tiprev)

2345

if not self._inline or total_size < _maxinline:

2345

if not self._inline or total_size < _maxinline:

2346

return

2346

return

2347

2348

troffset = tr.findoffset(self._indexfile)

2348

troffset = tr.findoffset(self._indexfile)

2349

if troffset is None:

2349

if troffset is None:

2350

raise error.RevlogError(

2350

raise error.RevlogError(

2351

_(b"%s not found in the transaction") % self._indexfile

2351

_(b"%s not found in the transaction") % self._indexfile

2352

)

2352

)

2353

if troffset:

2353

if troffset:

2354

tr.addbackup(self._indexfile, for_offset=True)

2354

tr.addbackup(self._indexfile, for_offset=True)

2355

tr.add(self._datafile, 0)

2355

tr.add(self._datafile, 0)

2356

2357

existing_handles = False

2357

existing_handles = False

2358

if self._writinghandles is not None:

2358

if self._writinghandles is not None:

2359

existing_handles = True

2359

existing_handles = True

2360

fp = self._writinghandles[0]

2360

fp = self._writinghandles[0]

2361

fp.flush()

2361

fp.flush()

2362

fp.close()

2362

fp.close()

2363

# We can't use the cached file handle after close(). So prevent

2363

# We can't use the cached file handle after close(). So prevent

2364

# its usage.

2364

# its usage.

2365

self._writinghandles = None

2365

self._writinghandles = None

2366

self._segmentfile.writing_handle = None

2366

self._segmentfile.writing_handle = None

2367

# No need to deal with sidedata writing handle as it is only

2367

# No need to deal with sidedata writing handle as it is only

2368

# relevant with revlog-v2 which is never inline, not reaching

2368

# relevant with revlog-v2 which is never inline, not reaching

2369

# this code

2369

# this code

2370

if side_write:

2370

if side_write:

2371

old_index_file_path = self._indexfile

2371

old_index_file_path = self._indexfile

2372

new_index_file_path = self._split_index_file

2372

new_index_file_path = self._split_index_file

2373

opener = self.opener

2373

opener = self.opener

2374

weak_self = weakref.ref(self)

2374

weak_self = weakref.ref(self)

2375

2376

# the "split" index replace the real index when the transaction is finalized

2376

# the "split" index replace the real index when the transaction is finalized

2377

def finalize_callback(tr):

2377

def finalize_callback(tr):

2378

opener.rename(

2378

opener.rename(

2379

new_index_file_path,

2379

new_index_file_path,

2380

old_index_file_path,

2380

old_index_file_path,

2381

checkambig=True,

2381

checkambig=True,

2382

)

2382

)

2383

maybe_self = weak_self()

2383

maybe_self = weak_self()

2384

if maybe_self is not None:

2384

if maybe_self is not None:

2385

maybe_self._indexfile = old_index_file_path

2385

maybe_self._indexfile = old_index_file_path

2386

2387

def abort_callback(tr):

2387

def abort_callback(tr):

2388

maybe_self = weak_self()

2388

maybe_self = weak_self()

2389

if maybe_self is not None:

2389

if maybe_self is not None:

2390

maybe_self._indexfile = old_index_file_path

2390

maybe_self._indexfile = old_index_file_path

2391

2392

tr.registertmp(new_index_file_path)

2392

tr.registertmp(new_index_file_path)

2393

if self.target[1] is not None:

2393

if self.target[1] is not None:

2394

callback_id = b'000-revlog-split-%d-%s' % self.target

2394

callback_id = b'000-revlog-split-%d-%s' % self.target

2395

else:

2395

else:

2396

callback_id = b'000-revlog-split-%d' % self.target[0]

2396

callback_id = b'000-revlog-split-%d' % self.target[0]

2397

tr.addfinalize(callback_id, finalize_callback)

2397

tr.addfinalize(callback_id, finalize_callback)

2398

tr.addabort(callback_id, abort_callback)

2398

tr.addabort(callback_id, abort_callback)

2399

2400

new_dfh = self._datafp(b'w+')

2400

new_dfh = self._datafp(b'w+')

2401

new_dfh.truncate(0) # drop any potentially existing data

2401

new_dfh.truncate(0) # drop any potentially existing data

2402

try:

2402

try:

2403

with self.reading():

2403

with self.reading():

2404

for r in self:

2404

for r in self:

2405

new_dfh.write(self._getsegmentforrevs(r, r)[1])

2405

new_dfh.write(self._getsegmentforrevs(r, r)[1])

2406

new_dfh.flush()

2406

new_dfh.flush()

2407

2408

if side_write:

2408

if side_write:

2409

self._indexfile = new_index_file_path

2409

self._indexfile = new_index_file_path

2410

with self.__index_new_fp() as fp:

2410

with self.__index_new_fp() as fp:

2411

self._format_flags &= ~FLAG_INLINE_DATA

2411

self._format_flags &= ~FLAG_INLINE_DATA

2412

self._inline = False

2412

self._inline = False

2413

for i in self:

2413

for i in self:

2414

e = self.index.entry_binary(i)

2414

e = self.index.entry_binary(i)

2415

if i == 0 and self._docket is None:

2415

if i == 0 and self._docket is None:

2416

header = self._format_flags | self._format_version

2416

header = self._format_flags | self._format_version

2417

header = self.index.pack_header(header)

2417

header = self.index.pack_header(header)

2418

e = header + e

2418

e = header + e

2419

fp.write(e)

2419

fp.write(e)

2420

if self._docket is not None:

2420

if self._docket is not None:

2421

self._docket.index_end = fp.tell()

2421

self._docket.index_end = fp.tell()

2422

2423

# If we don't use side-write, the temp file replace the real

2423

# If we don't use side-write, the temp file replace the real

2424

# index when we exit the context manager

2424

# index when we exit the context manager

2425

2426

nodemaputil.setup_persistent_nodemap(tr, self)

2426

nodemaputil.setup_persistent_nodemap(tr, self)

2427

self._segmentfile = randomaccessfile.randomaccessfile(

2427

self._segmentfile = randomaccessfile.randomaccessfile(

2428

self.opener,

2428

self.opener,

2429

self._datafile,

2429

self._datafile,

2430

self.data_config.chunk_cache_size,

2430

self.data_config.chunk_cache_size,

2431

)

2431

)

2432

2433

if existing_handles:

2433

if existing_handles:

2434

# switched from inline to conventional reopen the index

2434

# switched from inline to conventional reopen the index

2435

ifh = self.__index_write_fp()

2435

ifh = self.__index_write_fp()

2436

self._writinghandles = (ifh, new_dfh, None)

2436

self._writinghandles = (ifh, new_dfh, None)

2437

self._segmentfile.writing_handle = new_dfh

2437

self._segmentfile.writing_handle = new_dfh

2438

new_dfh = None

2438

new_dfh = None

2439

# No need to deal with sidedata writing handle as it is only

2439

# No need to deal with sidedata writing handle as it is only

2440

# relevant with revlog-v2 which is never inline, not reaching

2440

# relevant with revlog-v2 which is never inline, not reaching

2441

# this code

2441

# this code

2442

finally:

2442

finally:

2443

if new_dfh is not None:

2443

if new_dfh is not None:

2444

new_dfh.close()

2444

new_dfh.close()

2445

2446

def _nodeduplicatecallback(self, transaction, node):
    """called when trying to add a node already stored.

    This implementation has no body besides this docstring: it does nothing
    and returns None.

    NOTE(review): presumably a hook meant to be overridden by subclasses;
    the callers are not visible here -- confirm before relying on it.
    """

2448

2449

@contextlib.contextmanager
def reading(self):
    """Keep the data and sidedata segment files open while the body runs.

    When the index holds no entry there is nothing to read, so the body
    runs without opening anything.
    """
    if not len(self.index):
        yield  # nothing to be read
        return
    # The data file is entered first and released last.
    with self._segmentfile.reading(), self._segmentfile_sidedata.reading():
        yield

2458

2459

@contextlib.contextmanager

2459

@contextlib.contextmanager

2460

def _writing(self, transaction):

2460

def _writing(self, transaction):

2461

if self._trypending:

2461

if self._trypending:

2462

msg = b'try to write in a `trypending` revlog: %s'

2462

msg = b'try to write in a `trypending` revlog: %s'

2463

msg %= self.display_id

2463

msg %= self.display_id

2464

raise error.ProgrammingError(msg)

2464

raise error.ProgrammingError(msg)

2465

if self._writinghandles is not None:

2465

if self._writinghandles is not None:

2466

yield

2466

yield

2467

else:

2467

else:

2468

ifh = dfh = sdfh = None

2468

ifh = dfh = sdfh = None

2469

try:

2469

try:

2470

r = len(self)

2470

r = len(self)

2471

# opening the data file.

2471

# opening the data file.

2472

dsize = 0

2472

dsize = 0

2473

if r:

2473

if r:

2474

dsize = self.end(r - 1)

2474

dsize = self.end(r - 1)

2475

dfh = None

2475

dfh = None

2476

if not self._inline:

2476

if not self._inline:

2477

try:

2477

try:

2478

dfh = self._datafp(b"r+")

2478

dfh = self._datafp(b"r+")

2479

if self._docket is None:

2479

if self._docket is None:

2480

dfh.seek(0, os.SEEK_END)

2480

dfh.seek(0, os.SEEK_END)

2481

else:

2481

else:

2482

dfh.seek(self._docket.data_end, os.SEEK_SET)

2482

dfh.seek(self._docket.data_end, os.SEEK_SET)

2483

except FileNotFoundError:

2483

except FileNotFoundError:

2484

dfh = self._datafp(b"w+")

2484

dfh = self._datafp(b"w+")

2485

transaction.add(self._datafile, dsize)

2485

transaction.add(self._datafile, dsize)

2486

if self._sidedatafile is not None:

2486

if self._sidedatafile is not None:

2487

# revlog-v2 does not inline, help Pytype

2487

# revlog-v2 does not inline, help Pytype

2488

assert dfh is not None

2488

assert dfh is not None

2489

try:

2489

try:

2490

sdfh = self.opener(self._sidedatafile, mode=b"r+")

2490

sdfh = self.opener(self._sidedatafile, mode=b"r+")

2491

dfh.seek(self._docket.sidedata_end, os.SEEK_SET)

2491

dfh.seek(self._docket.sidedata_end, os.SEEK_SET)

2492

except FileNotFoundError:

2492

except FileNotFoundError:

2493

sdfh = self.opener(self._sidedatafile, mode=b"w+")

2493

sdfh = self.opener(self._sidedatafile, mode=b"w+")

2494

transaction.add(

2494

transaction.add(

2495

self._sidedatafile, self._docket.sidedata_end

2495

self._sidedatafile, self._docket.sidedata_end

2496

)

2496

)

2497

2498

# opening the index file.

2498

# opening the index file.

2499

isize = r * self.index.entry_size

2499

isize = r * self.index.entry_size

2500

ifh = self.__index_write_fp()

2500

ifh = self.__index_write_fp()

2501

if self._inline:

2501

if self._inline:

2502

transaction.add(self._indexfile, dsize + isize)

2502

transaction.add(self._indexfile, dsize + isize)

2503

else:

2503

else:

2504

transaction.add(self._indexfile, isize)

2504

transaction.add(self._indexfile, isize)

2505

# exposing all file handle for writing.

2505

# exposing all file handle for writing.

2506

self._writinghandles = (ifh, dfh, sdfh)

2506

self._writinghandles = (ifh, dfh, sdfh)

2507

self._segmentfile.writing_handle = ifh if self._inline else dfh

2507

self._segmentfile.writing_handle = ifh if self._inline else dfh

2508

self._segmentfile_sidedata.writing_handle = sdfh

2508

self._segmentfile_sidedata.writing_handle = sdfh

2509

yield

2509

yield

2510

if self._docket is not None:

2510

if self._docket is not None:

2511

self._write_docket(transaction)

2511

self._write_docket(transaction)

2512

finally:

2512

finally:

2513

self._writinghandles = None

2513

self._writinghandles = None

2514

self._segmentfile.writing_handle = None

2514

self._segmentfile.writing_handle = None

2515

self._segmentfile_sidedata.writing_handle = None

2515

self._segmentfile_sidedata.writing_handle = None

2516

if dfh is not None:

2516

if dfh is not None:

2517

dfh.close()

2517

dfh.close()

2518

if sdfh is not None:

2518

if sdfh is not None:

2519

sdfh.close()

2519

sdfh.close()

2520

# closing the index file last to avoid exposing referent to

2520

# closing the index file last to avoid exposing referent to

2521

# potential unflushed data content.

2521

# potential unflushed data content.

2522

if ifh is not None:

2522

if ifh is not None:

2523

ifh.close()

2523

ifh.close()

2524

2525

def _write_docket(self, transaction):

2525

def _write_docket(self, transaction):

2526

"""write the current docket on disk

2526

"""write the current docket on disk

2527

2528

Exist as a method to help changelog to implement transaction logic

2528

Exist as a method to help changelog to implement transaction logic

2529

2530

We could also imagine using the same transaction logic for all revlog

2530

We could also imagine using the same transaction logic for all revlog

2531

since docket are cheap."""

2531

since docket are cheap."""

2532

self._docket.write(transaction)

2532

self._docket.write(transaction)

2533

2534

def addrevision(
    self,
    text,
    transaction,
    link,
    p1,
    p2,
    cachedelta=None,
    node=None,
    flags=REVIDX_DEFAULT_FLAGS,
    deltacomputer=None,
    sidedata=None,
):
    """add a revision to the log

    text - the revision data to add
    transaction - the transaction object used for rollback
    link - the linkrev data to add
    p1, p2 - the parent nodeids of the revision
    cachedelta - an optional precomputed delta; it is dropped when the flag
        processors change the text
    node - nodeid of revision; typically node is not specified, and it is
        computed by default as hash(text, p1, p2), however subclasses might
        use different hashing method (and override checkhash() in such case)
    flags - the known flags to set on the revision
    deltacomputer - an optional deltacomputer instance shared between
        multiple calls
    sidedata - optional sidedata for the revision; passing non-empty
        sidedata to a revlog that does not support it is a programming
        error

    Returns the revision number: the existing one when the node is already
    stored, otherwise whatever addrawrevision() returns.
    """
    if link == nullrev:
        msg = _(b"attempted to add linkrev -1 to %s") % self.display_id
        raise error.RevlogError(msg)

    if sidedata is None:
        sidedata = {}
    if sidedata and not self.feature_config.has_side_data:
        msg = _(b"trying to add sidedata to a revlog who don't support them")
        raise error.ProgrammingError(msg)

    # With flags set, the node is computed from the text as it is before
    # the flag processors run.
    if flags and not node:
        node = self.hash(text, p1, p2)

    rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

    # A provided cachedelta no longer applies once the flag processors
    # have modified the revision data.
    if rawtext != text:
        cachedelta = None

    rawsize = len(rawtext)
    if rawsize > _maxentrysize:
        msg = _(b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB")
        raise error.RevlogError(msg % (self.display_id, rawsize))

    if not node:
        node = self.hash(rawtext, p1, p2)

    # Nothing to do when the node is already stored.
    known_rev = self.index.get_rev(node)
    if known_rev is not None:
        return known_rev

    if validatehash:
        self.checkhash(rawtext, node, p1=p1, p2=p2)

    return self.addrawrevision(
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=cachedelta,
        deltacomputer=deltacomputer,
        sidedata=sidedata,
    )

2611

2612

def addrawrevision(
    self,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    node,
    flags,
    cachedelta=None,
    deltacomputer=None,
    sidedata=None,
):
    """add a raw revision with known flags, node and parents

    Useful when reusing a revision not stored in this revlog (ex: received
    over wire, or read from an external bundle).

    The work is delegated to _addrevision() inside a _writing() context;
    its return value is returned unchanged.
    """
    # note: _addrevision() takes `node` first, then the raw text
    positional = (node, rawtext, transaction, link, p1, p2, flags, cachedelta)
    with self._writing(transaction):
        return self._addrevision(
            *positional,
            deltacomputer=deltacomputer,
            sidedata=sidedata,
        )

2642

2643

def compress(self, data):
    """Generate a possibly-compressed representation of data.

    Returns a ``(header, payload)`` pair of bytes:

    - ``(b'', data)`` when data is empty,
    - ``(b'', compressed)`` when the compressor produced output (the
      compressor already put its own header in the returned data),
    - ``(b'', data)`` when the uncompressed data starts with a NUL byte,
    - ``(b'u', data)`` otherwise.
    """
    if data:
        packed = self._compressor.compress(data)
        if packed:
            # The revlog compressor added the header in the returned data.
            return b'', packed
        if data[0:1] != b'\0':
            return b'u', data
    return b'', data

2657

2658

def decompress(self, data):
    """Decompress a revlog chunk.

    The first byte of the chunk is a header identifying the format, which
    selects the decompressor to use. Empty chunks are returned as is.
    """
    if not data:
        return data

    # Revlogs are read far more often than they are written, and many
    # chunks decompress in microseconds, so this code is performance
    # sensitive.
    #
    # Assumptions made about revlogs:
    #
    # 1) most chunks are compressed (as opposed to inline raw data).
    # 2) decompressing *any* data is likely at least 10x slower than
    #    returning raw inline data.
    # 3) common and officially supported compression engines should be
    #    prioritized.
    #
    # Hence the "compressed with a common, officially supported engine"
    # case is optimized over "raw data" and "data encoded by less common
    # or non-official engines": the inline lookups come first, followed by
    # the compengines lookup.
    #
    # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
    # compressed chunks. And this matters for changelog and manifest reads.
    header = data[0:1]

    if header == b'x':
        try:
            return _zlibdecompress(data)
        except zlib.error as exc:
            message = _(
                b'revlog decompress error: %s'
            ) % stringutil.forcebytestr(exc)
            raise error.RevlogError(message)

    # '\0' is more common than 'u' so it goes first.
    if header == b'\0':
        return data

    if header == b'u':
        # skip the one-byte marker
        return util.buffer(data, 1)

    engine = self._get_decompressor(header)
    return engine.decompress(data)

2707

2708

def _addrevision(
    self,
    node,
    rawtext,
    transaction,
    link,
    p1,
    p2,
    flags,
    cachedelta,
    alwayscache=False,
    deltacomputer=None,
    sidedata=None,
):
    """internal function to add revisions to the log

    see addrevision for argument descriptions.

    note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

    if "deltacomputer" is not provided or None, a defaultdeltacomputer will
    be used.

    if "alwayscache" is set and no rawtext was provided, the raw text is
    rebuilt through the deltacomputer so that it can be cached.

    invariants:
    - rawtext is optional (can be None); if not set, cachedelta must be set.
      if both are set, they must correspond to each other.

    returns the revision number given to the new entry (the length of the
    revlog before the entry is appended).

    raises RevlogError when asked to add the null or a wdir node, and
    ProgrammingError when called without open writing handles.
    """
    if node == self.nullid:
        raise error.RevlogError(
            _(b"%s: attempt to add null revision") % self.display_id
        )
    if (
        node == self.nodeconstants.wdirid
        or node in self.nodeconstants.wdirfilenodeids
    ):
        raise error.RevlogError(
            _(b"%s: attempt to add wdir revision") % self.display_id
        )
    if self._writinghandles is None:
        msg = b'adding revision outside `revlog._writing` context'
        raise error.ProgrammingError(msg)

    # The raw text travels in a one-item list; it is read back from
    # `btext[0]` once the entry has been written.
    btext = [rawtext]

    # `curr` is the revision number the new entry will get.
    curr = len(self)
    prev = curr - 1

    offset = self._get_data_offset(prev)

    if self._concurrencychecker:
        ifh, dfh, sdfh = self._writinghandles
        # XXX no checking for the sidedata file
        if self._inline:
            # offset is "as if" it were in the .d file, so we need to add on
            # the size of the entry metadata.
            self._concurrencychecker(
                ifh, self._indexfile, offset + curr * self.index.entry_size
            )
        else:
            # Entries in the .i are a consistent size.
            self._concurrencychecker(
                ifh, self._indexfile, curr * self.index.entry_size
            )
            self._concurrencychecker(dfh, self._datafile, offset)

    p1r, p2r = self.rev(p1), self.rev(p2)

    # full versions are inserted when the needed deltas
    # become comparable to the uncompressed text
    if rawtext is None:
        # need rawtext size, before changed by flag processors, which is
        # the non-raw size. use revlog explicitly to avoid filelog's extra
        # logic that might remove metadata size.
        textlen = mdiff.patchedsize(
            revlog.size(self, cachedelta[0]), cachedelta[1]
        )
    else:
        textlen = len(rawtext)

    if deltacomputer is None:
        # Build a default delta computer; debug output goes through the
        # transaction's reporter only when delta debugging is enabled.
        write_debug = None
        if self.delta_config.debug_delta:
            write_debug = transaction._report
        deltacomputer = deltautil.deltacomputer(
            self, write_debug=write_debug
        )

    if cachedelta is not None and len(cachedelta) == 2:
        # If the cached delta has no information about how it should be
        # reused, add the default reuse instruction according to the
        # revlog's configuration.
        if (
            self.delta_config.general_delta
            and self.delta_config.lazy_delta_base
        ):
            delta_base_reuse = DELTA_BASE_REUSE_TRY
        else:
            delta_base_reuse = DELTA_BASE_REUSE_NO
        cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)

    revinfo = revlogutils.revisioninfo(
        node,
        p1,
        p2,
        btext,
        textlen,
        cachedelta,
        flags,
    )

    deltainfo = deltacomputer.finddeltainfo(revinfo)

    # Without a docket the compression mode stays "inline"; with one, the
    # mode (and possibly the delta info) come from delta_compression().
    compression_mode = COMP_MODE_INLINE
    if self._docket is not None:
        default_comp = self._docket.default_compression_header
        r = deltautil.delta_compression(default_comp, deltainfo)
        compression_mode, deltainfo = r

    sidedata_compression_mode = COMP_MODE_INLINE
    if sidedata and self.feature_config.has_side_data:
        sidedata_compression_mode = COMP_MODE_PLAIN
        serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
        sidedata_offset = self._docket.sidedata_end
        h, comp_sidedata = self.compress(serialized_sidedata)
        # Keep the compressed form only when compression really happened
        # (no b'u' marker, no leading NUL) and the result is smaller.
        if (
            h != b'u'
            and comp_sidedata[0:1] != b'\0'
            and len(comp_sidedata) < len(serialized_sidedata)
        ):
            assert not h
            if (
                comp_sidedata[0:1]
                == self._docket.default_compression_header
            ):
                sidedata_compression_mode = COMP_MODE_DEFAULT
                serialized_sidedata = comp_sidedata
            else:
                sidedata_compression_mode = COMP_MODE_INLINE
                serialized_sidedata = comp_sidedata
    else:
        serialized_sidedata = b""
        # Don't store the offset if the sidedata is empty, that way
        # we can easily detect empty sidedata and they will be no different
        # than ones we manually add.
        sidedata_offset = 0

    rank = RANK_UNKNOWN
    if self.feature_config.compute_rank:
        if (p1r, p2r) == (nullrev, nullrev):
            # no parent at all
            rank = 1
        elif p1r != nullrev and p2r == nullrev:
            rank = 1 + self.fast_rank(p1r)
        elif p1r == nullrev and p2r != nullrev:
            rank = 1 + self.fast_rank(p2r)
        else:  # merge node
            if rustdagop is not None and self.index.rust_ext_compat:
                rank = rustdagop.rank(self.index, p1r, p2r)
            else:
                # rank of the higher-numbered parent, plus one for each
                # revision yielded by findmissingrevs([pmax], [pmin])
                pmin, pmax = sorted((p1r, p2r))
                rank = 1 + self.fast_rank(pmax)
                rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))

    e = revlogutils.entry(
        flags=flags,
        data_offset=offset,
        data_compressed_length=deltainfo.deltalen,
        data_uncompressed_length=textlen,
        data_compression_mode=compression_mode,
        data_delta_base=deltainfo.base,
        link_rev=link,
        parent_rev_1=p1r,
        parent_rev_2=p2r,
        node_id=node,
        sidedata_offset=sidedata_offset,
        sidedata_compressed_length=len(serialized_sidedata),
        sidedata_compression_mode=sidedata_compression_mode,
        rank=rank,
    )

    # The in-memory index is updated first; the binary form of the new
    # entry is then read back from it for writing.
    self.index.append(e)
    entry = self.index.entry_binary(curr)
    if curr == 0 and self._docket is None:
        # First entry of a docket-less revlog: prepend the packed
        # format flags/version header.
        header = self._format_flags | self._format_version
        header = self.index.pack_header(header)
        entry = header + entry
    self._writeentry(
        transaction,
        entry,
        deltainfo.data,
        link,
        offset,
        serialized_sidedata,
        sidedata_offset,
    )

    rawtext = btext[0]

    if alwayscache and rawtext is None:
        rawtext = deltacomputer.buildtext(revinfo)

    if type(rawtext) == bytes:  # only accept immutable objects
        self._revisioncache = (node, curr, rawtext)
    self._chainbasecache[curr] = deltainfo.chainbase
    return curr

2912

2913

def _get_data_offset(self, prev):

2913

def _get_data_offset(self, prev):

2914

"""Returns the current offset in the (in-transaction) data file.

2914

"""Returns the current offset in the (in-transaction) data file.

2915

Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket

2915

Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket

2916

file to store that information: since sidedata can be rewritten to the

2916

file to store that information: since sidedata can be rewritten to the

2917

end of the data file within a transaction, you can have cases where, for

2917

end of the data file within a transaction, you can have cases where, for

2918

example, rev `n` does not have sidedata while rev `n - 1` does, leading

2918

example, rev `n` does not have sidedata while rev `n - 1` does, leading

2919

to `n - 1`'s sidedata being written after `n`'s data.

2919

to `n - 1`'s sidedata being written after `n`'s data.

2920

2921

TODO cache this in a docket file before getting out of experimental."""

2921

TODO cache this in a docket file before getting out of experimental."""

2922

if self._docket is None:

2922

if self._docket is None:

2923

return self.end(prev)

2923

return self.end(prev)

2924

else:

2924

else:

2925

return self._docket.data_end

2925

return self._docket.data_end

2926

2927

def _writeentry(
    self, transaction, entry, data, link, offset, sidedata, sidedata_offset
):
    """Write one index entry, its data and its sidedata to the open handles.

    ``data`` is indexed as ``data[0]`` and ``data[1]``; both parts are
    written back to back. ``link`` is accepted but not used here.

    Raises ``error.ProgrammingError`` when no writing handles are open.
    """
    handles = self._writinghandles
    if handles is None:
        msg = b'adding revision outside `revlog._writing` context'
        raise error.ProgrammingError(msg)
    index_fh, data_fh, sidedata_fh = handles

    # Files opened in a+ mode behave inconsistently across platforms.
    # Windows requires a file positioning call when a handle transitions
    # between reads and writes (see 3686fa2b8eee and the
    # mixedfilemodewrapper in windows.py). Elsewhere Python or the
    # platform itself can be buggy: some versions of Solaris have been
    # observed to not append at the end of the file if the file was
    # seeked to before the end (see issue4943).
    #
    # The workaround is to seek explicitly before writing.
    # Note: this is likely not necessary on Python 3. However, because the
    # file handle is reused for reads and may be seeked there, we need to
    # be careful before changing this.
    docket = self._docket
    if docket is not None:
        index_fh.seek(docket.index_end, os.SEEK_SET)
    else:
        index_fh.seek(0, os.SEEK_END)
    if data_fh:
        if docket is not None:
            data_fh.seek(docket.data_end, os.SEEK_SET)
        else:
            data_fh.seek(0, os.SEEK_END)
    if sidedata_fh:
        sidedata_fh.seek(docket.sidedata_end, os.SEEK_SET)

    curr = len(self) - 1
    if self._inline:
        # inline revlog: entry and data are interleaved in the index file
        offset += curr * self.index.entry_size
        transaction.add(self._indexfile, offset)
        index_fh.write(entry)
        index_fh.write(data[0])
        index_fh.write(data[1])
        assert not sidedata
        self._enforceinlinesize(transaction)
    else:
        transaction.add(self._datafile, offset)
        if self._sidedatafile:
            transaction.add(self._sidedatafile, sidedata_offset)
        transaction.add(self._indexfile, curr * len(entry))
        if data[0]:
            data_fh.write(data[0])
        data_fh.write(data[1])
        if sidedata:
            sidedata_fh.write(sidedata)
        index_fh.write(entry)

    # Both the docket and the handles are read again from ``self`` here
    # rather than reusing the locals captured above.
    docket = self._docket
    if docket is not None:
        # revlog-v2 always has 3 writing handles, help Pytype
        current = self._writinghandles
        wh_index = current[0]
        wh_data = current[1]
        wh_sidedata = current[2]
        assert wh_index is not None
        assert wh_data is not None
        assert wh_sidedata is not None
        docket.index_end = wh_index.tell()
        docket.data_end = wh_data.tell()
        docket.sidedata_end = wh_sidedata.tell()

    nodemaputil.setup_persistent_nodemap(transaction, self)

2991

2992

def addgroup(
    self,
    deltas,
    linkmapper,
    transaction,
    alwayscache=False,
    addrevisioncb=None,
    duplicaterevisioncb=None,
    debug_info=None,
    delta_base_reuse_policy=None,
):
    """Add a group of deltas to the revision log.

    Each item of ``deltas`` is an 8-tuple ``(node, p1, p2, linknode,
    deltabase, delta, flags, sidedata)``. The first delta is against its
    parent, which should be in our log; the rest are against the
    previous delta.

    If ``addrevisioncb`` is defined, it is called with this revlog and
    the revision returned by ``_addrevision`` for every revision added.
    If ``duplicaterevisioncb`` is defined, it is called with this revlog
    and the existing revision for every node that is already stored.

    Returns True if at least one item of ``deltas`` was processed
    (added or found to be a duplicate), False otherwise.
    """
    if self._adding_group:
        raise error.ProgrammingError(b'cannot nest addgroup() calls')

    # read the default delta-base reuse policy from revlog config if the
    # group did not specify one.
    if delta_base_reuse_policy is None:
        dconf = self.delta_config
        reuse = dconf.general_delta and dconf.lazy_delta_base
        delta_base_reuse_policy = (
            DELTA_BASE_REUSE_TRY if reuse else DELTA_BASE_REUSE_NO
        )

    self._adding_group = True
    processed_any = False
    try:
        with self._writing(transaction):
            write_debug = (
                transaction._report
                if self.delta_config.debug_delta
                else None
            )
            deltacomputer = deltautil.deltacomputer(
                self,
                write_debug=write_debug,
                debug_info=debug_info,
            )
            # loop through our set of deltas
            for (
                node,
                p1,
                p2,
                linknode,
                deltabase,
                delta,
                flags,
                sidedata,
            ) in deltas:
                link = linkmapper(linknode)
                flags = flags or REVIDX_DEFAULT_FLAGS

                known_rev = self.index.get_rev(node)
                if known_rev is not None:
                    # this can happen if two branches make the same change
                    self._nodeduplicatecallback(transaction, known_rev)
                    if duplicaterevisioncb:
                        duplicaterevisioncb(self, known_rev)
                    processed_any = True
                    continue

                for parent in (p1, p2):
                    if not self.index.has_node(parent):
                        raise error.LookupError(
                            parent, self.radix, _(b'unknown parent')
                        )

                if not self.index.has_node(deltabase):
                    raise error.LookupError(
                        deltabase, self.display_id, _(b'unknown delta base')
                    )

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # if base is censored, delta must be full replacement
                    # in a single patch operation
                    header_len = struct.calcsize(b">lll")
                    old_len = self.rawsize(baserev)
                    new_len = len(delta) - header_len
                    expected_header = mdiff.replacediffheader(
                        old_len, new_len
                    )
                    if delta[:header_len] != expected_header:
                        raise error.CensoredBaseError(
                            self.display_id, self.node(baserev)
                        )

                if not flags and self._peek_iscensored(baserev, delta):
                    flags |= REVIDX_ISCENSORED

                # We assume consumers of addrevisioncb will want to
                # retrieve the added revision, which will require a call
                # to revision(). revision() will fast path if there is a
                # cache hit. So, we tell _addrevision() to always cache in
                # this case.
                # We're only using addgroup() in the context of changegroup
                # generation so the revision data can always be handled as
                # raw by the flagprocessor.
                new_rev = self._addrevision(
                    node,
                    None,
                    transaction,
                    link,
                    p1,
                    p2,
                    flags,
                    (baserev, delta, delta_base_reuse_policy),
                    alwayscache=alwayscache,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

                if addrevisioncb:
                    addrevisioncb(self, new_rev)
                processed_any = True
    finally:
        self._adding_group = False
    return processed_any

3120

3121

def iscensored(self, rev):
    """Tell whether file revision ``rev`` is censored.

    Returns False when the revlog is not censorable; otherwise returns
    the revision's flags masked with ``REVIDX_ISCENSORED``.
    """
    if self.feature_config.censorable:
        return self.flags(rev) & REVIDX_ISCENSORED
    return False

3127

3128

def _peek_iscensored(self, baserev, delta):

3128

def _peek_iscensored(self, baserev, delta):

3129

"""Quickly check if a delta produces a censored revision."""

3129

"""Quickly check if a delta produces a censored revision."""

3130

if not self.feature_config.censorable:

3130

if not self.feature_config.censorable:

3131

return False

3131

return False

3132

3133

return storageutil.deltaiscensored(delta, baserev, self.rawsize)

3133

return storageutil.deltaiscensored(delta, baserev, self.rawsize)

3134

3135

def getstrippoint(self, minlink):
    """Find the minimum rev that must be stripped to strip the linkrev.

    Returns a tuple containing the minimum rev and a set of all revs
    that have linkrevs that will be broken by this strip.
    """
    tip_rev = len(self) - 1
    heads = self.headrevs()
    return storageutil.resolvestripinfo(
        minlink,
        tip_rev,
        heads,
        self.linkrev,
        self.parentrevs,
    )

3148

3149

def strip(self, minlink, transaction):
    """Truncate the revlog on the first revision with a linkrev >= minlink.

    This function is called when we're stripping revision minlink and
    its descendants from the repository.

    We have to remove all revisions with linkrev >= minlink, because
    the equivalent changelog revisions will be renumbered after the
    strip.

    So we truncate the revlog on the first of these revisions, and
    trust that the caller has saved the revisions that shouldn't be
    removed and that it'll re-add them after this truncation.
    """
    if not len(self):
        return

    rev, _broken = self.getstrippoint(minlink)
    if rev == len(self):
        return

    # first truncate the files on disk
    data_end = self.start(rev)
    if self._inline:
        # inline revlog: index entries and data share the index file
        index_end = data_end + (rev * self.index.entry_size)
    else:
        transaction.add(self._datafile, data_end)
        index_end = rev * self.index.entry_size

    if self._sidedatafile:
        sidedata_end = self.sidedata_cut_off(rev)
        transaction.add(self._sidedatafile, sidedata_end)

    transaction.add(self._indexfile, index_end)
    docket = self._docket
    if docket is not None:
        # XXX we could leverage the docket while stripping. However it
        # is not powerful enough at the time of this comment
        docket.index_end = index_end
        docket.data_end = data_end
        docket.sidedata_end = sidedata_end
        docket.write(transaction, stripping=True)

    # then reset internal state in memory to forget those revisions
    self._revisioncache = None
    self._chaininfocache = util.lrucachedict(500)
    self._segmentfile.clear_cache()
    self._segmentfile_sidedata.clear_cache()

    del self.index[rev:-1]

3198

3199

def checksize(self):
    """Check size of index and data files.

    Return a (dd, di) tuple.
    - dd: extra bytes for the "data" file
    - di: extra bytes for the "index" file

    A healthy revlog will return (0, 0). A missing file counts as zero
    extra bytes for that file.
    """
    expected = 0
    if len(self):
        expected = max(0, self.end(len(self) - 1))

    try:
        with self._datafp() as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        dd = actual - expected
    except FileNotFoundError:
        dd = 0

    try:
        # Use a context manager so the index handle is closed even when
        # seek()/tell() raises.
        with self.opener(self._indexfile) as f:
            f.seek(0, io.SEEK_END)
            actual = f.tell()
        s = self.index.entry_size
        i = max(0, actual // s)
        di = actual - (i * s)
        if self._inline:
            # inline revlog: the index file also holds the revision data,
            # so the data-file delta is zero and the index delta must
            # account for the data bytes of every revision.
            databytes = sum(max(0, self.length(r)) for r in self)
            dd = 0
            di = actual - len(self) * s - databytes
    except FileNotFoundError:
        di = 0

    return (dd, di)

3238

3239

def files(self):
    """Return the list of file paths backing this revlog.

    The index file always comes first. Without a docket file, the data
    file is added unless the revlog is inline. With a docket file, the
    docket file, the old index/data/sidedata file paths reported by the
    docket, and the current data and sidedata files (when their
    recorded end offset is non-zero) are added.
    """
    paths = [self._indexfile]

    if self._docket_file is None:
        if not self._inline:
            paths.append(self._datafile)
        return paths

    docket = self._docket
    paths.append(self._docket_file)
    paths.extend(docket.old_index_filepaths(include_empty=False))
    if docket.data_end:
        paths.append(self._datafile)
    paths.extend(docket.old_data_filepaths(include_empty=False))
    if docket.sidedata_end:
        paths.append(self._sidedatafile)
    paths.extend(docket.old_sidedata_filepaths(include_empty=False))
    return paths

3254

3255

def emitrevisions(
    self,
    nodes,
    nodesorder=None,
    revisiondata=False,
    assumehaveparentrevisions=False,
    deltamode=repository.CG_DELTAMODE_STD,
    sidedata_helpers=None,
    debug_info=None,
):
    """Emit revision deltas for ``nodes`` via ``storageutil.emitrevisions``.

    ``nodesorder`` must be one of ``b'nodes'``, ``b'storage'``,
    ``b'linear'`` or None; anything else raises
    ``error.ProgrammingError``. When it is None and the revlog does not
    use general delta, ``b'storage'`` order is used.

    When the revlog does not store delta chains, ``deltamode`` is forced
    to ``CG_DELTAMODE_FULL`` unless it is ``CG_DELTAMODE_PREV``.
    """
    accepted_orders = (b'nodes', b'storage', b'linear', None)
    if nodesorder not in accepted_orders:
        raise error.ProgrammingError(
            b'unhandled value for nodesorder: %s' % nodesorder
        )

    if nodesorder is None:
        if not self.delta_config.general_delta:
            nodesorder = b'storage'

    if not self._storedeltachains:
        if deltamode != repository.CG_DELTAMODE_PREV:
            deltamode = repository.CG_DELTAMODE_FULL

    return storageutil.emitrevisions(
        self,
        nodes,
        nodesorder,
        revlogrevisiondelta,
        deltaparentfn=self.deltaparent,
        candeltafn=self._candelta,
        rawsizefn=self.rawsize,
        revdifffn=self.revdiff,
        flagsfn=self.flags,
        deltamode=deltamode,
        revisiondata=revisiondata,
        assumehaveparentrevisions=assumehaveparentrevisions,
        sidedata_helpers=sidedata_helpers,
        debug_info=debug_info,
    )

3295

3296

# Delta reuse policies accepted by ``clone()``.
DELTAREUSEALWAYS = b'always'
DELTAREUSESAMEREVS = b'samerevs'
DELTAREUSENEVER = b'never'

DELTAREUSEFULLADD = b'fulladd'

# Every valid value for the ``deltareuse`` argument of ``clone()``.
DELTAREUSEALL = {
    DELTAREUSEALWAYS,
    DELTAREUSESAMEREVS,
    DELTAREUSENEVER,
    DELTAREUSEFULLADD,
}

3303

3304

def clone(
    self,
    tr,
    destrevlog,
    addrevisioncb=None,
    deltareuse=DELTAREUSESAMEREVS,
    forcedeltabothparents=None,
    sidedata_helpers=None,
):
    """Copy this revlog to another, possibly with format changes.

    The destination revlog will contain the same revisions and nodes.
    However, it may not be bit-for-bit identical due to e.g. delta
    encoding differences.

    The ``deltareuse`` argument controls how deltas from the existing
    revlog are preserved in the destination revlog. The argument can
    have the following values:

    DELTAREUSEALWAYS
       Deltas will always be reused (if possible), even if the
       destination revlog would not select the same revisions for the
       delta. This is the fastest mode of operation.
    DELTAREUSESAMEREVS
       Deltas will be reused if the destination revlog would pick the
       same revisions for the delta. This mode strikes a balance between
       speed and optimization.
    DELTAREUSENEVER
       Deltas will never be reused. This is the slowest mode of
       execution. This mode can be used to recompute deltas (e.g. if the
       diff/delta algorithm changes).
    DELTAREUSEFULLADD
       Revisions will be re-added as if they were new content. This is
       slower than DELTAREUSEALWAYS but allows more mechanisms to kick
       in, e.g. large file detection and handling.

    Delta computation can be slow, so the choice of delta reuse policy
    can significantly affect run time.

    The default policy (``DELTAREUSESAMEREVS``) strikes a balance
    between two extremes. Deltas will be reused if they are appropriate.
    But if the delta could choose a better revision, it will do so. This
    means if you are converting a non-generaldelta revlog to a
    generaldelta revlog, deltas will be recomputed if the delta's parent
    isn't a parent of the revision.

    In addition to the delta policy, the ``forcedeltabothparents``
    argument controls whether to force computing deltas against both
    parents for merges. A falsy value falls back to the destination
    revlog's existing ``delta_both_parents`` setting.

    See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
    `sidedata_helpers`.

    Raises ``ValueError`` when ``deltareuse`` is invalid, when the
    destination revlog is not empty, or when either revlog has filtered
    revisions. The destination's ``delta_config`` is restored on exit.
    """
    if deltareuse not in self.DELTAREUSEALL:
        raise ValueError(
            _(b'value for deltareuse invalid: %s') % deltareuse
        )

    if len(destrevlog):
        raise ValueError(_(b'destination revlog is not empty'))

    if getattr(self, 'filteredrevs', None):
        raise ValueError(_(b'source revlog has filtered revisions'))
    if getattr(destrevlog, 'filteredrevs', None):
        raise ValueError(_(b'destination revlog has filtered revisions'))

    # lazydelta and lazydeltabase control whether to reuse a cached
    # delta, if possible. Work on a copy so the original configuration
    # can be put back afterwards.
    saved_config = destrevlog.delta_config
    destrevlog.delta_config = saved_config.copy()

    try:
        # policy -> (lazy_delta_base, lazy_delta); DELTAREUSEFULLADD is
        # deliberately absent and leaves both settings untouched.
        lazy_by_policy = {
            self.DELTAREUSEALWAYS: (True, True),
            self.DELTAREUSESAMEREVS: (False, True),
            self.DELTAREUSENEVER: (False, False),
        }
        lazy = lazy_by_policy.get(deltareuse)
        if lazy is not None:
            destrevlog.delta_config.lazy_delta_base = lazy[0]
            destrevlog.delta_config.lazy_delta = lazy[1]

        destrevlog.delta_config.delta_both_parents = (
            forcedeltabothparents or saved_config.delta_both_parents
        )

        with self.reading():
            self._clone(
                tr,
                destrevlog,
                addrevisioncb,
                deltareuse,
                forcedeltabothparents,
                sidedata_helpers,
            )

    finally:
        destrevlog.delta_config = saved_config

3403

3404

def _clone(
    self,
    tr,
    destrevlog,
    addrevisioncb,
    deltareuse,
    forcedeltabothparents,
    sidedata_helpers,
):
    """perform the core duty of `revlog.clone` after parameter processing

    Every revision of ``self`` is re-added, in iteration order, to
    ``destrevlog`` within transaction ``tr``.

    ``deltareuse`` is only compared against ``self.DELTAREUSEFULLADD``
    here: with that policy each revision goes through the destination's
    public ``addrevision()``; otherwise ``_addrevision()`` is used and
    the stored delta is offered for reuse when ``destrevlog._lazydelta``
    is set.

    ``sidedata_helpers``, when not None, is run for every revision
    through ``sidedatautil.run_sidedata_helpers``; the flags it reports
    are first added to, then removed from, the revision flags.

    ``addrevisioncb``, when set, is called as
    ``addrevisioncb(self, rev, node)`` after each revision is written.

    ``forcedeltabothparents`` is accepted to mirror the caller's
    arguments; this method does not read it.
    """
    write_debug = None
    if self.delta_config.debug_delta:
        write_debug = tr._report
    deltacomputer = deltautil.deltacomputer(
        destrevlog,
        write_debug=write_debug,
    )
    index = self.index
    for rev in self:
        entry = index[rev]

        # Some classes override linkrev to take filtered revs into
        # account. Use raw entry from index.
        flags = entry[0] & 0xFFFF
        linkrev = entry[4]
        p1 = index[entry[5]][7]
        p2 = index[entry[6]][7]
        node = entry[7]

        # (Possibly) reuse the delta from the revlog if allowed and
        # the revlog chunk is a delta.
        cachedelta = None
        rawtext = None
        if deltareuse == self.DELTAREUSEFULLADD:
            text = self._revisiondata(rev)
            sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # `&` binds tighter than `|`: without the parentheses
                # the removal mask would only be applied to the flags
                # being added and could never clear an existing flag.
                flags = (flags | new_flags[0]) & ~new_flags[1]

            destrevlog.addrevision(
                text,
                tr,
                linkrev,
                p1,
                p2,
                cachedelta=cachedelta,
                node=node,
                flags=flags,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )
        else:
            if destrevlog._lazydelta:
                dp = self.deltaparent(rev)
                if dp != nullrev:
                    cachedelta = (dp, bytes(self._chunk(rev)))

            sidedata = None
            if not cachedelta:
                rawtext = self._revisiondata(rev)
                sidedata = self.sidedata(rev)
            if sidedata is None:
                sidedata = self.sidedata(rev)

            if sidedata_helpers is not None:
                (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                    self, sidedata_helpers, sidedata, rev
                )
                # see the note in the DELTAREUSEFULLADD branch above
                flags = (flags | new_flags[0]) & ~new_flags[1]

            with destrevlog._writing(tr):
                destrevlog._addrevision(
                    node,
                    rawtext,
                    tr,
                    linkrev,
                    p1,
                    p2,
                    flags,
                    cachedelta,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )

        if addrevisioncb:
            addrevisioncb(self, rev, node)

3494

3495

def censorrevision(self, tr, censornode, tombstone=b''):
    """Censor ``censornode``, dispatching on the revlog format version.

    A REVLOGV0 revlog is rejected with ``error.RevlogError``. REVLOGV1
    is handed to ``rewrite.v1_censor``; every other version goes to
    ``rewrite.v2_censor``. Nothing is returned.
    """
    version = self._format_version
    if version == REVLOGV0:
        raise error.RevlogError(
            _(b'cannot censor with version %d revlogs') % version
        )

    if version == REVLOGV1:
        censor = rewrite.v1_censor
    else:
        censor = rewrite.v2_censor
    censor(self, tr, censornode, tombstone)

3505

3506

def verifyintegrity(self, state):
    """Verifies the integrity of the revlog.

    Yields ``revlogproblem`` instances describing problems that are
    found.

    ``state`` is a dict shared with the caller. ``expectedversion`` and
    ``erroroncensored`` are read from it, as is the optional
    ``skipflags``. ``skipread`` and ``safe_renamed`` are reset to empty
    sets here, and nodes whose content was not, or could not be, read
    are added to ``skipread``.
    """
    data_excess, index_excess = self.checksize()
    if data_excess:
        yield revlogproblem(
            error=_(b'data length off by %d bytes') % data_excess
        )
    if index_excess:
        yield revlogproblem(
            error=_(b'index contains %d extra bytes') % index_excess
        )

    version = self._format_version
    expected = state[b'expectedversion']

    # The verifier tells us what version revlog we should be.
    if version != expected:
        yield revlogproblem(
            warning=_(b"warning: '%s' uses revlog format %d; expected %d")
            % (self.display_id, version, expected)
        )

    state[b'skipread'] = set()
    state[b'safe_renamed'] = set()

    for rev in self:
        node = self.node(rev)

        # Verify contents. 4 cases to care about:
        #
        #   common: the most common case
        #   rename: with a rename
        #   meta: file content starts with b'\1\n', the metadata
        #         header defined in filelog.py, but without a rename
        #   ext: content stored externally
        #
        # More formally, their differences are shown below:
        #
        #                       | common | rename | meta  | ext
        #  -------------------------------------------------------
        #   flags()             | 0      | 0      | 0     | not 0
        #   renamed()           | False  | True   | False | ?
        #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
        #
        # "rawtext" means the raw text stored in revlog data, which
        # could be retrieved by "rawdata(rev)". "text"
        # mentioned below is "revision(rev)".
        #
        # There are 3 different lengths stored physically:
        #  1. L1: rawsize, stored in revlog index
        #  2. L2: len(rawtext), stored in revlog data
        #  3. L3: len(text), stored in revlog data if flags==0, or
        #     possibly somewhere else if flags!=0
        #
        # L1 should be equal to L2. L3 could be different from them.
        # "text" may or may not affect commit hash depending on flag
        # processors (see flagutil.addflagprocessor).
        #
        #              | common  | rename | meta  | ext
        # -------------------------------------------------
        #    rawsize() | L1      | L1     | L1    | L1
        #       size() | L1      | L2-LM  | L1(*) | L1 (?)
        # len(rawtext) | L2      | L2     | L2    | L2
        #    len(text) | L2      | L2     | L2    | L3
        #  len(read()) | L2      | L2-LM  | L2-LM | L3 (?)
        #
        # LM:  length of metadata, depending on rawtext
        # (*): not ideal, see comment in filelog.size
        # (?): could be "- len(meta)" if the resolved content has
        #      rename metadata
        #
        # Checks needed to be done:
        #  1. length check: L1 == L2, in all cases.
        #  2. hash check: depending on flag processor, we may need to
        #     use either "text" (external), or "rawtext" (in revlog).

        try:
            skipflags = state.get(b'skipflags', 0)
            if skipflags:
                # only keep the skip flags this revision actually carries
                skipflags &= self.flags(rev)

            _verify_revision(self, skipflags, state, node)

            indexed_size = self.rawsize(rev)
            actual_size = len(self.rawdata(node))

            if indexed_size != actual_size:
                yield revlogproblem(
                    error=_(b'unpacked size is %d, %d expected')
                    % (actual_size, indexed_size),
                    node=node,
                )

        except error.CensoredNodeError:
            if state[b'erroroncensored']:
                yield revlogproblem(
                    error=_(b'censored file data'), node=node
                )
                state[b'skipread'].add(node)
        except Exception as e:
            yield revlogproblem(
                error=_(b'unpacking %s: %s')
                % (short(node), stringutil.forcebytestr(e)),
                node=node,
            )
            state[b'skipread'].add(node)

3610

3611

def storageinfo(
    self,
    exclusivefiles=False,
    sharedfiles=False,
    revisionscount=False,
    trackedsize=False,
    storedsize=False,
):
    """Return a dict holding the storage facts that were asked for.

    Each true argument adds the bytes key of the same name:

    - ``exclusivefiles``: ``(opener, path)`` pairs for the index file
      and, unless the revlog is inline, the data file
    - ``sharedfiles``: always an empty list
    - ``revisionscount``: ``len(self)``
    - ``trackedsize``: sum of ``rawsize()`` over every revision
    - ``storedsize``: sum of the ``st_size`` of every path in
      ``self.files()``
    """
    info = {}

    if exclusivefiles:
        owned = [(self.opener, self._indexfile)]
        if not self._inline:
            owned.append((self.opener, self._datafile))
        info[b'exclusivefiles'] = owned

    if sharedfiles:
        info[b'sharedfiles'] = []

    if revisionscount:
        info[b'revisionscount'] = len(self)

    if trackedsize:
        info[b'trackedsize'] = sum(self.rawsize(rev) for rev in self)

    if storedsize:
        on_disk = 0
        for path in self.files():
            on_disk += self.opener.stat(path).st_size
        info[b'storedsize'] = on_disk

    return info

3641

3642

def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
    """Generate and store sidedata for revisions ``startrev``..``endrev``.

    Both bounds are inclusive. Nothing happens when the revlog has no
    sidedata support, or when ``helpers[1]`` and ``helpers[2]`` are both
    empty (nothing to generate or remove).

    For each revision the helpers are run starting from an empty
    sidedata dict. The result is serialized, compressed when that makes
    it smaller, and appended to the sidedata file. The index entries are
    then rewritten with the new sidedata offset, length, flags and
    compression mode.

    Raises ``error.Abort`` when a revision in the range already has
    sidedata recorded in its index entry.
    """
    if not self.feature_config.has_side_data:
        return
    # revlog formats with sidedata support does not support inline
    assert not self._inline
    if not helpers[1] and not helpers[2]:
        # Nothing to generate or remove
        return

    new_entries = []
    # append the new sidedata
    with self._writing(transaction):
        ifh, _dfh, sdfh = self._writinghandles
        # `sidedata_end` is an offset into the sidedata file and every
        # write below goes through `sdfh`, so that is the handle that has
        # to be positioned (the data file handle is not used here).
        sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)

        current_offset = sdfh.tell()
        for rev in range(startrev, endrev + 1):
            entry = self.index[rev]
            new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                store=self,
                sidedata_helpers=helpers,
                sidedata={},
                rev=rev,
            )

            serialized_sidedata = sidedatautil.serialize_sidedata(
                new_sidedata
            )

            sidedata_compression_mode = COMP_MODE_INLINE
            if serialized_sidedata and self.feature_config.has_side_data:
                sidedata_compression_mode = COMP_MODE_PLAIN
                h, comp_sidedata = self.compress(serialized_sidedata)
                # Compare one-byte slices: indexing bytes yields an int,
                # which never equals a bytes value.
                first_byte = comp_sidedata[0:1]
                if (
                    h != b'u'
                    and first_byte != b'\0'
                    and len(comp_sidedata) < len(serialized_sidedata)
                ):
                    assert not h
                    # presumably `default_compression_header` is a
                    # one-byte bytes value -- confirm against the docket
                    if first_byte == self._docket.default_compression_header:
                        sidedata_compression_mode = COMP_MODE_DEFAULT
                        serialized_sidedata = comp_sidedata
                    else:
                        sidedata_compression_mode = COMP_MODE_INLINE
                        serialized_sidedata = comp_sidedata
            if entry[8] != 0 or entry[9] != 0:
                # rewriting entries that already have sidedata is not
                # supported yet, because it introduces garbage data in the
                # revlog.
                msg = b"rewriting existing sidedata is not supported yet"
                raise error.Abort(msg)

            # Apply (potential) flags to add and to remove after running
            # the sidedata helpers. The parentheses matter: `&` binds
            # tighter than `|`, so without them the removal mask would
            # never clear a flag already present in the entry.
            new_offset_flags = (entry[0] | flags[0]) & ~flags[1]
            entry_update = (
                current_offset,
                len(serialized_sidedata),
                new_offset_flags,
                sidedata_compression_mode,
            )

            # the sidedata computation might have move the file cursors
            # around
            sdfh.seek(current_offset, os.SEEK_SET)
            sdfh.write(serialized_sidedata)
            new_entries.append(entry_update)
            current_offset += len(serialized_sidedata)
        self._docket.sidedata_end = sdfh.tell()

        # rewrite the new index entries
        ifh.seek(startrev * self.index.entry_size)
        for i, e in enumerate(new_entries):
            rev = startrev + i
            self.index.replace_sidedata_info(rev, *e)
            packed = self.index.entry_binary(rev)
            if rev == 0 and self._docket is None:
                header = self._format_flags | self._format_version
                header = self.index.pack_header(header)
                packed = header + packed
            ifh.write(packed)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # revlog.py - storage back-end for mercurial
             # coding: utf8
             #
             # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Storage back-end for Mercurial.
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches.
             """
             import binascii
             import collections
             import contextlib
             import io
             import os
             import struct
             import weakref
             import zlib
             # import stuff from node for others to import from revlog
             from .node import (
                 bin,
                 hex,
                 nullrev,
                 sha1nodeconstants,
                 short,
                 wdirrev,
             )
             from .i18n import _
             from .revlogutils.constants import (
                 ALL_KINDS,
                 CHANGELOGV2,
                 COMP_MODE_DEFAULT,
                 COMP_MODE_INLINE,
                 COMP_MODE_PLAIN,
                 DELTA_BASE_REUSE_NO,
                 DELTA_BASE_REUSE_TRY,
                 ENTRY_RANK,
                 FEATURES_BY_VERSION,
                 FLAG_GENERALDELTA,
                 FLAG_INLINE_DATA,
                 INDEX_HEADER,
                 KIND_CHANGELOG,
                 KIND_FILELOG,
                 RANK_UNKNOWN,
                 REVLOGV0,
                 REVLOGV1,
                 REVLOGV1_FLAGS,
                 REVLOGV2,
                 REVLOGV2_FLAGS,
                 REVLOG_DEFAULT_FLAGS,
                 REVLOG_DEFAULT_FORMAT,
                 REVLOG_DEFAULT_VERSION,
                 SUPPORTED_FLAGS,
             )
             from .revlogutils.flagutil import (
                 REVIDX_DEFAULT_FLAGS,
                 REVIDX_ELLIPSIS,
                 REVIDX_EXTSTORED,
                 REVIDX_FLAGS_ORDER,
                 REVIDX_HASCOPIESINFO,
                 REVIDX_ISCENSORED,
                 REVIDX_RAWTEXT_CHANGING_FLAGS,
             )
             from .thirdparty import attr
             from . import (
                 ancestor,
                 dagop,
                 error,
                 mdiff,
                 policy,
                 pycompat,
                 revlogutils,
                 templatefilters,
                 util,
             )
             from .interfaces import (
                 repository,
                 util as interfaceutil,
             )
             from .revlogutils import (
                 deltas as deltautil,
                 docket as docketutil,
                 flagutil,
                 nodemap as nodemaputil,
                 randomaccessfile,
                 revlogv0,
                 rewrite,
                 sidedata as sidedatautil,
             )
             from .utils import (
                 storageutil,
                 stringutil,
             )
             # Bare references to every re-exported name, so that pyflakes does not
             # report the imports above as unused. These names must stay available
             # in this module because extensions import them from here.
             REVLOGV0
             REVLOGV1
             REVLOGV2
             CHANGELOGV2
             FLAG_INLINE_DATA
             FLAG_GENERALDELTA
             REVLOG_DEFAULT_FLAGS
             REVLOG_DEFAULT_FORMAT
             REVLOG_DEFAULT_VERSION
             REVLOGV1_FLAGS
             REVLOGV2_FLAGS
             REVIDX_ISCENSORED
             REVIDX_ELLIPSIS
             REVIDX_HASCOPIESINFO
             REVIDX_EXTSTORED
             REVIDX_DEFAULT_FLAGS
             REVIDX_FLAGS_ORDER
             REVIDX_RAWTEXT_CHANGING_FLAGS
             # Implementation modules resolved through `policy`.
             # NOTE(review): `rustrevlog` is compared against None further down, so
             # `importrust` presumably returns None when the Rust module is missing.
             parsers = policy.importmod('parsers')
             rustancestor = policy.importrust('ancestor')
             rustdagop = policy.importrust('dagop')
             rustrevlog = policy.importrust('revlog')
             # Aliased for performance.
             _zlibdecompress = zlib.decompress
             # max size of inline data embedded into a revlog (131072 = 128 * 1024)
             _maxinline = 131072
             # Flag processors for REVIDX_ELLIPSIS: they leave the text untouched.
             def ellipsisreadprocessor(rl, text):
                 """Read processor: return ``text`` unchanged, paired with False."""
                 return (text, False)
             def ellipsiswriteprocessor(rl, text):
                 """Write processor: return ``text`` unchanged, paired with False."""
                 return (text, False)
             def ellipsisrawprocessor(rl, text):
                 """Raw processor: always return False."""
                 return False
             # (read, write, raw) triple grouping the processors above
             ellipsisprocessor = (
                 ellipsisreadprocessor,
                 ellipsiswriteprocessor,
                 ellipsisrawprocessor,
             )
             def _verify_revision(rl, skipflags, state, node):
                 """Verify the integrity of the given revlog ``node`` while providing a hook
                 point for extensions to influence the operation."""
                 if skipflags:
                     state[b'skipread'].add(node)
                 else:
                     # Side-effect: read content and verify hash.
                     rl.revision(node)
             # True if a fast implementation for persistent-nodemap is available
             #
             # The "pure" Python implementation is also counted as "fast": people
             # running pure do not really have performance considerations (and face
             # a wheelbarrow of other sources of slowness anyway).
             HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
                 parsers, 'BaseIndexObject'
             )
             @interfaceutil.implementer(repository.irevisiondelta)
             @attr.s(slots=True)
             class revlogrevisiondelta:
                 """Slotted attrs record declared to implement ``irevisiondelta``."""
                 # Every field is a required constructor argument, in this order,
                 # except ``linknode`` which defaults to None.
                 node = attr.ib()
                 p1node = attr.ib()
                 p2node = attr.ib()
                 basenode = attr.ib()
                 flags = attr.ib()
                 baserevisionsize = attr.ib()
                 revision = attr.ib()
                 delta = attr.ib()
                 sidedata = attr.ib()
                 protocol_flags = attr.ib()
                 linknode = attr.ib(default=None)
             @interfaceutil.implementer(repository.iverifyproblem)
             @attr.s(frozen=True)
             class revlogproblem:
                 """Frozen attrs record declared to implement ``iverifyproblem``.

                 All fields default to None. ``revlog.verifyintegrity`` builds
                 instances with either ``warning=`` or ``error=``, adding ``node=``
                 for problems tied to one revision.
                 """
                 warning = attr.ib(default=None)
                 error = attr.ib(default=None)
                 node = attr.ib(default=None)
             def parse_index_v1(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2`` defaults.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # the actual parsing is delegated to the `parsers` module
                 parsed_index, chunk_cache = parsers.parse_index2(data, inline)
                 return parsed_index, chunk_cache
             def parse_index_v2(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2`` as REVLOGV2.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # the actual parsing is delegated to the `parsers` module
                 parsed_index, chunk_cache = parsers.parse_index2(
                     data, inline, format=REVLOGV2
                 )
                 return parsed_index, chunk_cache
             def parse_index_cl_v2(data, inline):
                 """Parse index ``data`` with ``parsers.parse_index2`` as CHANGELOGV2.

                 Returns the ``(index, cache)`` pair produced by the parser.
                 """
                 # the actual parsing is delegated to the `parsers` module
                 parsed_index, chunk_cache = parsers.parse_index2(
                     data, inline, format=CHANGELOGV2
                 )
                 return parsed_index, chunk_cache
             if not hasattr(parsers, 'parse_index_devel_nodemap'):
                 # the loaded `parsers` module has no devel nodemap parser
                 parse_index_v1_nodemap = None
             else:
                 def parse_index_v1_nodemap(data, inline):
                     """Parse index ``data`` with the devel nodemap parser.

                     Returns the ``(index, cache)`` pair produced by
                     ``parsers.parse_index_devel_nodemap``.
                     """
                     parsed_index, chunk_cache = parsers.parse_index_devel_nodemap(
                         data, inline
                     )
                     return parsed_index, chunk_cache
             def parse_index_v1_mixed(data, inline):
                 """Parse a v1 index and wrap it in ``rustrevlog.MixedIndex``.

                 Returns ``(wrapped index, cache)``; the cache is the one returned
                 by ``parse_index_v1``.
                 """
                 v1_index, chunk_cache = parse_index_v1(data, inline)
                 wrapped = rustrevlog.MixedIndex(v1_index)
                 return wrapped, chunk_cache
             # corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
             # signed integer)
             _maxentrysize = 0x7FFFFFFF
             # Error template with four placeholders, in order: the revlog (%s),
             # the number of bytes expected, the offset read from and the actual
             # data size (%d each).
             FILE_TOO_SHORT_MSG = _(
                 b'cannot read from revlog %s;'
                 b'  expected %d bytes from offset %d, data size is %d'
             )
             # every ASCII hexadecimal digit, lower and upper case, as bytes
             hexdigits = b'0123456789abcdefABCDEF'
             class _Config:
                 def copy(self):
                     return self.__class__(**self.__dict__)
             @attr.s()
             class FeatureConfig(_Config):
                 """Hold configuration values about the available revlog features"""
                 # name of the compression engine used by default
                 compression_engine = attr.ib(default=b'zlib')
                 # options for the compression engines (a fresh dict per instance)
                 compression_engine_options = attr.ib(default=attr.Factory(dict))
                 # whether censoring is allowed on this revlog
                 censorable = attr.ib(default=False)
                 # whether this revlog uses the "side data" feature
                 has_side_data = attr.ib(default=False)
                 # might remove rank configuration once the computation has no impact
                 compute_rank = attr.ib(default=False)
                 # Parent order is supposed to be semantically irrelevant, so parents
                 # are normally re-sorted to make the first parent non-null whenever
                 # a non-null parent exists.
                 # filelog abuses the parent order as a flag marking some instances
                 # of meta-encoded files, so it is allowed to disable this behavior.
                 canonical_parent_order = attr.ib(default=False)
                 # whether ellipsis commits can be used
                 enable_ellipsis = attr.ib(default=False)
                 def copy(self):
                     """Return a copy that does not share the options dict."""
                     duplicate = super().copy()
                     # the generic copy hands the same dict object to the new
                     # instance, so give the duplicate its own
                     duplicate.compression_engine_options = (
                         self.compression_engine_options.copy()
                     )
                     return duplicate
             @attr.s()
             class DataConfig(_Config):
                 """Hold configuration values about how the revlog data are read"""
                 # should we try to open the "pending" version of the revlog
                 try_pending = attr.ib(default=False)
                 # should we try to open the "split" version of the revlog
                 try_split = attr.ib(default=False)
                 # When True, indexfile should be opened with checkambig=True at
                 # writing, to avoid file stat ambiguity.
                 check_ambig = attr.ib(default=False)
                 # If true, use mmap instead of reading to deal with large index
                 mmap_large_index = attr.ib(default=False)
                 # size from which an index counts as "large" for the option above
                 mmap_index_threshold = attr.ib(default=None)
                 # How much data to read and cache into the raw revlog data cache.
                 chunk_cache_size = attr.ib(default=65536)
                 # Allow sparse reading of the revlog data
                 with_sparse_read = attr.ib(default=False)
                 # minimal density of a sparse read chunk
                 sr_density_threshold = attr.ib(default=0.50)
                 # minimal size of data we skip when performing sparse read
                 sr_min_gap_size = attr.ib(default=262144)
                 # are deltas encoded against arbitrary bases.
                 generaldelta = attr.ib(default=False)
             @attr.s()
             class DeltaConfig(_Config):
                 """Hold configuration values about how new deltas are computed

                 Some attributes are duplicated from DataConfig to help keep each
                 object self-contained.
                 """
                 # can deltas be encoded against arbitrary bases.
                 general_delta = attr.ib(default=False)
                 # Allow sparse writing of the revlog data
                 sparse_revlog = attr.ib(default=False)
                 # maximum length of a delta chain
                 max_chain_len = attr.ib(default=None)
                 # Maximum distance between delta chain base start and end
                 max_deltachain_span = attr.ib(default=-1)
                 # If `upper_bound_comp` is not None, this is the expected maximal gain from
                 # compression for the data content.
                 upper_bound_comp = attr.ib(default=None)
                 # Should we try a delta against both parents
                 delta_both_parents = attr.ib(default=True)
                 # Test delta base candidate group by chunk of this maximal size.
                 candidate_group_chunk_size = attr.ib(default=0)
                 # Should we display debug information about delta computation
                 debug_delta = attr.ib(default=False)
                 # trust incoming deltas by default
                 lazy_delta = attr.ib(default=True)
                 # trust the base of incoming deltas by default
                 lazy_delta_base = attr.ib(default=False)
             class revlog:
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, including its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 If checkambig, indexfile is opened with checkambig=True at
                 writing, to avoid file stat ambiguity.
                 If mmaplargeindex is True, and an mmapindexthreshold is set, the
                 index will be mmapped rather than read if it is larger than the
                 configured threshold.
                 If censorable is True, the revlog can have censored revisions.
                 If `upperboundcomp` is not None, this is the expected maximal gain from
                 compression for the data content.
                 `concurrencychecker` is an optional function that receives 3 arguments: a
                 file handle, a filename, and an expected position. It should check whether
                 the current position in the file handle is valid, and log/warn/fail (by
                 raising).
                 See mercurial/revlogutils/constants.py for details about the content of an
                 index entry.
                 """
                 _flagserrorclass = error.RevlogError
                 @staticmethod
                 def is_inline_index(header_bytes):
                     """Tell whether index header bytes describe an inline revlog

                     `header_bytes` is unpacked with INDEX_HEADER. The low 16 bits of the
                     unpacked value select the format version, the remaining bits are the
                     format flags passed to that version's `inline` feature check.
                     """
                     unpacked = INDEX_HEADER.unpack(header_bytes)
                     raw_header = unpacked[0]
                     flags = raw_header & ~0xFFFF
                     version = raw_header & 0xFFFF
                     inline_check = FEATURES_BY_VERSION[version][b'inline']
                     return inline_check(flags)
                 def __init__(
                     self,
                     opener,
                     target,
                     radix,
                     postfix=None,  # only exist for `tmpcensored` now
                     checkambig=False,
                     mmaplargeindex=False,
                     censorable=False,
                     upperboundcomp=None,
                     persistentnodemap=False,
                     concurrencychecker=None,
                     trypending=False,
                     try_split=False,
                     canonical_parent_order=True,
                 ):
                     """
                     create a revlog object

                     opener is a function that abstracts the file opening operation
                     and can be used to implement COW semantics or the like. Its
                     `options` mapping is consulted for the `feature-config`,
                     `data-config` and `delta-config` entries; each one found is copied,
                     otherwise a default config object is created.

                     `target`: a (KIND, ID) tuple that identifies the content stored in
                     this revlog. It helps the rest of the code to understand what the
                     revlog is about without having to resort to heuristic and index
                     filename analysis. Note: this must reliably be set by normal code,
                     but test, debug, or performance measurement code might not set this
                     to an accurate value.

                     `radix` and `postfix` are used to build the file names.

                     `checkambig` and `mmaplargeindex` are stored on `data_config`,
                     `censorable` and `canonical_parent_order` on `feature_config`.

                     `persistentnodemap`: when true, the nodemap file name is obtained
                     from `nodemaputil.get_nodemap_file`.

                     `trypending` and `try_split` are stored and used when selecting the
                     entry point file in `_loadindex()`.

                     The index is loaded (through `_loadindex()`) before returning.
                     """
                     self.upperboundcomp = upperboundcomp
                     self.radix = radix
                     # file names; the ones still None here are filled by _loadindex()
                     self._docket_file = None
                     self._indexfile = None
                     self._datafile = None
                     self._sidedatafile = None
                     self._nodemap_file = None
                     self.postfix = postfix
                     self._trypending = trypending
                     self._try_split = try_split
                     self.opener = opener
                     if persistentnodemap:
                         self._nodemap_file = nodemaputil.get_nodemap_file(self)
                     # note: target[0] is checked before the length of the tuple
                     assert target[0] in ALL_KINDS
                     assert len(target) == 2
                     self.target = target
                     # work on copies of the shared config objects so the per-instance
                     # overrides below do not leak into the opener options
                     if b'feature-config' in self.opener.options:
                         self.feature_config = self.opener.options[b'feature-config'].copy()
                     else:
                         self.feature_config = FeatureConfig()
                     self.feature_config.censorable = censorable
                     self.feature_config.canonical_parent_order = canonical_parent_order
                     if b'data-config' in self.opener.options:
                         self.data_config = self.opener.options[b'data-config'].copy()
                     else:
                         self.data_config = DataConfig()
                     self.data_config.check_ambig = checkambig
                     self.data_config.mmap_large_index = mmaplargeindex
                     if b'delta-config' in self.opener.options:
                         self.delta_config = self.opener.options[b'delta-config'].copy()
                     else:
                         self.delta_config = DeltaConfig()
                     # 3-tuple of (node, rev, text) for a raw revision.
                     self._revisioncache = None
                     # Maps rev to chain base rev.
                     self._chainbasecache = util.lrucachedict(100)
                     # 2-tuple of (offset, data) of raw data from the revlog at an offset.
                     self._chunkcache = (0, b'')
                     self.index = None
                     self._docket = None
                     self._nodemap_docket = None
                     # Mapping of partial identifiers to full nodes.
                     self._pcache = {}
                     # other optional features
                     # Make copy of flag processors so each revlog instance can support
                     # custom flags.
                     self._flagprocessors = dict(flagutil.flagprocessors)
                     # 3-tuple of file handles being used for active writing.
                     self._writinghandles = None
                     # prevent nesting of addgroup
                     self._adding_group = None
                     # reads the configuration set above and fills `self.index`
                     self._loadindex()
                     # only assigned once the index has been loaded
                     self._concurrencychecker = concurrencychecker
                 @property
                 def _generaldelta(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.general_delta
                 @property
                 def _checkambig(self):
                     """temporary compatibility proxy"""
                     return self.data_config.check_ambig
                 @property
                 def _mmaplargeindex(self):
                     """temporary compatibility proxy"""
                     return self.data_config.mmap_large_index
                 @property
                 def _censorable(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.censorable
                 @property
                 def _chunkcachesize(self):
                     """temporary compatibility proxy"""
                     return self.data_config.chunk_cache_size
                 @property
                 def _maxchainlen(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.max_chain_len
                 @property
                 def _deltabothparents(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.delta_both_parents
                 @property
                 def _candidate_group_chunk_size(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.candidate_group_chunk_size
                 @property
                 def _debug_delta(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.debug_delta
                 @property
                 def _compengine(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.compression_engine
                 @property
                 def _compengineopts(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.compression_engine_options
                 @property
                 def _maxdeltachainspan(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.max_deltachain_span
                 @property
                 def _withsparseread(self):
                     """temporary compatibility proxy"""
                     return self.data_config.with_sparse_read
                 @property
                 def _sparserevlog(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.sparse_revlog
                 @property
                 def hassidedata(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.has_side_data
                 @property
                 def _srdensitythreshold(self):
                     """temporary compatibility proxy"""
                     return self.data_config.sr_density_threshold
                 @property
                 def _srmingapsize(self):
                     """temporary compatibility proxy"""
                     return self.data_config.sr_min_gap_size
                 @property
                 def _compute_rank(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.compute_rank
                 @property
                 def canonical_parent_order(self):
                     """temporary compatibility proxy"""
                     return self.feature_config.canonical_parent_order
                 @property
                 def _lazydelta(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.lazy_delta
                 @property
                 def _lazydeltabase(self):
                     """temporary compatibility proxy"""
                     return self.delta_config.lazy_delta_base
                 def _init_opts(self):
                     """Turn opener options and config objects into revlog defaults

                     The on-disk content may later override these values. The result is
                     consumed by _loadindex() as a 3-tuple:

                     * new_header:
                         version header to use if a new revlog has to be created
                     * mmapindexthreshold:
                         minimal index size to start using mmap (None when
                         `data_config.mmap_large_index` is off)
                     * force_nodemap:
                         value of the `devel-force-nodemap` option (False when unset),
                         forcing the usage of a "development" version of the nodemap code

                     As side effects this may set `feature_config.compute_rank` and it
                     registers extra flag processors in `self._flagprocessors`.

                     Raises RevlogError when `data_config.chunk_cache_size` is not a
                     strictly positive power of 2.
                     """
                     options = self.opener.options

                     # select the header used when creating a brand new revlog
                     if b'changelogv2' in options and self.revlog_kind == KIND_CHANGELOG:
                         header = CHANGELOGV2
                         self.feature_config.compute_rank = options.get(
                             b'changelogv2.compute-rank', True
                         )
                     elif b'revlogv2' in options:
                         header = REVLOGV2
                     elif b'revlogv1' in options:
                         header = REVLOGV1 | FLAG_INLINE_DATA
                         if b'generaldelta' in options:
                             header |= FLAG_GENERALDELTA
                     elif b'revlogv0' in options:
                         header = REVLOGV0
                     else:
                         header = REVLOG_DEFAULT_VERSION

                     # the mmap threshold only matters when mmap is enabled at all
                     threshold = (
                         self.data_config.mmap_index_threshold
                         if self.data_config.mmap_large_index
                         else None
                     )

                     if self.feature_config.enable_ellipsis:
                         self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor
                     # revlog v0 doesn't have flag processors
                     extra_processors = options.get(b'flagprocessors', {})
                     for flag, processor in extra_processors.items():
                         flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

                     cache_size = self.data_config.chunk_cache_size
                     if cache_size <= 0:
                         raise error.RevlogError(
                             _(b'revlog chunk cache size %r is not greater than 0')
                             % cache_size
                         )
                     # a power of 2 shares no bit with its predecessor
                     if cache_size & (cache_size - 1):
                         raise error.RevlogError(
                             _(b'revlog chunk cache size %r is not a power of 2')
                             % cache_size
                         )

                     return header, threshold, options.get(b'devel-force-nodemap', False)
                 def _get_data(self, filepath, mmap_threshold, size=None):
                     """return a file content with or without mmap
                     If the file is missing return the empty string"""
                     try:
                         with self.opener(filepath) as fp:
                             if mmap_threshold is not None:
                                 file_size = self.opener.fstat(fp).st_size
                                 if file_size >= mmap_threshold:
                                     if size is not None:
                                         # avoid potentiel mmap crash
                                         size = min(file_size, size)
                                     # TODO: should .close() to release resources without
                                     # relying on Python GC
                                     if size is None:
                                         return util.buffer(util.mmapread(fp))
                                     else:
                                         return util.buffer(util.mmapread(fp, size))
                             if size is None:
                                 return fp.read()
                             else:
                                 return fp.read(size)
                     except FileNotFoundError:
                         return b''
                 def get_streams(self, max_linkrev, force_inline=False):
                     """return a list of streams that represent this revlog

                     This is used by stream-clone to do bytes to bytes copies of a repository.

                     This streams data for all revisions that refer to a changelog revision up
                     to `max_linkrev`: trailing revisions whose linkrev is not strictly
                     lower than `max_linkrev` are left out.

                     If `force_inline` is set, it enforces that the stream will represent an inline revlog.

                     It returns a list of three-tuples (an empty list when there is
                     nothing to send):

                         [
                             (filename, bytes_stream, stream_size),
                             …
                         ]
                     """
                     n = len(self)
                     index = self.index
                     # walk back from the tip until a revision below `max_linkrev` is found
                     while n > 0:
                         linkrev = index[n - 1][4]
                         if linkrev < max_linkrev:
                             break
                         # note: this loop will rarely go through multiple iterations, since
                         # it only traverses commits created during the current streaming
                         # pull operation.
                         #
                         # If this become a problem, using a binary search should cap the
                         # runtime of this.
                         n = n - 1
                     if n == 0:
                         # no data to send
                         return []
                     # sizes are computed now, for the first `n` revisions only
                     index_size = n * index.entry_size
                     data_size = self.end(n - 1)
                     # XXX we might have been split (or stripped) since the object
                     # initialization, We need to close this race too, but having a way to
                     # pre-open the file we feed to the revlog and never closing them before
                     # we are done streaming.
                     if self._inline:
                         # inline revlog: a single file holds both index and data
                         def get_stream():
                             with self._indexfp() as fp:
                                 # first yield is a placeholder consumed by the `next()`
                                 # call below, so the file is already open on return
                                 yield None
                                 size = index_size + data_size
                                 if size <= 65536:
                                     yield fp.read(size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=size)
                         inline_stream = get_stream()
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     elif force_inline:
                         # non-inline revlog streamed as if it was inline: each index
                         # entry is emitted followed by the data segment of its revision
                         def get_stream():
                             with self.reading():
                                 # placeholder consumed by the `next()` call below
                                 yield None
                                 for rev in range(n):
                                     idx = self.index.entry_binary(rev)
                                     if rev == 0 and self._docket is None:
                                         # re-inject the inline flag
                                         header = self._format_flags
                                         header |= self._format_version
                                         header |= FLAG_INLINE_DATA
                                         header = self.index.pack_header(header)
                                         idx = header + idx
                                     yield idx
                                     yield self._getsegmentforrevs(rev, rev)[1]
                         inline_stream = get_stream()
                         next(inline_stream)
                         return [
                             (self._indexfile, inline_stream, index_size + data_size),
                         ]
                     else:
                         # separate index and data files: one stream for each
                         def get_index_stream():
                             with self._indexfp() as fp:
                                 # placeholder consumed by the `next()` call below
                                 yield None
                                 if index_size <= 65536:
                                     yield fp.read(index_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=index_size)
                         def get_data_stream():
                             with self._datafp() as fp:
                                 # placeholder consumed by the `next()` call below
                                 yield None
                                 if data_size <= 65536:
                                     yield fp.read(data_size)
                                 else:
                                     yield from util.filechunkiter(fp, limit=data_size)
                         index_stream = get_index_stream()
                         next(index_stream)
                         data_stream = get_data_stream()
                         next(data_stream)
                         # the data file is listed before the index file
                         return [
                             (self._datafile, data_stream, data_size),
                             (self._indexfile, index_stream, index_size),
                         ]
                 def _loadindex(self, docket=None):
                     """Read the entry point of the revlog and set up the index

                     The entry point file is selected from `postfix`, the pending and the
                     split settings. Unless a `docket` is passed in, the header found in
                     that file (or the default header for an empty revlog) determines the
                     format version and flags.

                     This sets, among others, `self.index`, the file names, `_inline`,
                     `delta_config.general_delta`, and the segment file objects.

                     Raises RevlogError for an unknown version, unknown flags, a
                     truncated docket-based index, or an index that fails to parse.
                     """
                     new_header, mmapindexthreshold, force_nodemap = self._init_opts()
                     # select the entry point: explicit postfix first, then the pending
                     # file, then the split index file, then the plain `.i` file
                     if self.postfix is not None:
                         entry_point = b'%s.i.%s' % (self.radix, self.postfix)
                     elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
                         entry_point = b'%s.i.a' % self.radix
                     elif self._try_split and self.opener.exists(self._split_index_file):
                         entry_point = self._split_index_file
                     else:
                         entry_point = b'%s.i' % self.radix
                     if docket is not None:
                         # a docket was provided by the caller: no header parsing here
                         self._docket = docket
                         self._docket_file = entry_point
                     else:
                         self._initempty = True
                         entry_data = self._get_data(entry_point, mmapindexthreshold)
                         if len(entry_data) > 0:
                             header = INDEX_HEADER.unpack(entry_data[:4])[0]
                             self._initempty = False
                         else:
                             # nothing on disk: use the header computed by _init_opts()
                             header = new_header
                         # low 16 bits: format version, remaining bits: format flags
                         self._format_flags = header & ~0xFFFF
                         self._format_version = header & 0xFFFF
                         supported_flags = SUPPORTED_FLAGS.get(self._format_version)
                         if supported_flags is None:
                             msg = _(b'unknown version (%d) in revlog %s')
                             msg %= (self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         elif self._format_flags & ~supported_flags:
                             msg = _(b'unknown flags (%#04x) in version %d revlog %s')
                             display_flag = self._format_flags >> 16
                             msg %= (display_flag, self._format_version, self.display_id)
                             raise error.RevlogError(msg)
                         features = FEATURES_BY_VERSION[self._format_version]
                         self._inline = features[b'inline'](self._format_flags)
                         self.delta_config.general_delta = features[b'generaldelta'](
                             self._format_flags
                         )
                         self.feature_config.has_side_data = features[b'sidedata']
                         if not features[b'docket']:
                             # the entry point is the index itself
                             self._indexfile = entry_point
                             index_data = entry_data
                         else:
                             # the entry point is a docket pointing to the other files
                             self._docket_file = entry_point
                             if self._initempty:
                                 self._docket = docketutil.default_docket(self, header)
                             else:
                                 self._docket = docketutil.parse_docket(
                                     self, entry_data, use_pending=self._trypending
                                 )
                     if self._docket is not None:
                         # docket based revlog: the index lives in a file named by the
                         # docket and only its first `index_end` bytes are read
                         self._indexfile = self._docket.index_filepath()
                         index_data = b''
                         index_size = self._docket.index_end
                         if index_size > 0:
                             index_data = self._get_data(
                                 self._indexfile, mmapindexthreshold, size=index_size
                             )
                             if len(index_data) < index_size:
                                 msg = _(b'too few index data for %s: got %d, expected %d')
                                 msg %= (self.display_id, len(index_data), index_size)
                                 raise error.RevlogError(msg)
                         self._inline = False
                         # generaldelta implied by version 2 revlogs.
                         self.delta_config.general_delta = True
                         # the logic for persistent nodemap will be dealt with within the
                         # main docket, so disable it for now.
                         self._nodemap_file = None
                     # data file names come from the docket when there is one, otherwise
                     # they are derived from the radix (and postfix)
                     if self._docket is not None:
                         self._datafile = self._docket.data_filepath()
                         self._sidedatafile = self._docket.sidedata_filepath()
                     elif self.postfix is None:
                         self._datafile = b'%s.d' % self.radix
                     else:
                         self._datafile = b'%s.d.%s' % (self.radix, self.postfix)
                     self.nodeconstants = sha1nodeconstants
                     self.nullid = self.nodeconstants.nullid
                     # sparse-revlog can't be on without general-delta (issue6056)
                     if not self.delta_config.general_delta:
                         self.delta_config.sparse_revlog = False
                     self._storedeltachains = True
                     devel_nodemap = (
                         self._nodemap_file
                         and force_nodemap
                         and parse_index_v1_nodemap is not None
                     )
                     use_rust_index = False
                     if rustrevlog is not None:
                         if self._nodemap_file is not None:
                             use_rust_index = True
                         else:
                             use_rust_index = self.opener.options.get(b'rust.index')
                     # pick the index parser; the version specific ones take precedence
                     # over the nodemap and rust variants of the v1 parser
                     self._parse_index = parse_index_v1
                     if self._format_version == REVLOGV0:
                         self._parse_index = revlogv0.parse_index_v0
                     elif self._format_version == REVLOGV2:
                         self._parse_index = parse_index_v2
                     elif self._format_version == CHANGELOGV2:
                         self._parse_index = parse_index_cl_v2
                     elif devel_nodemap:
                         self._parse_index = parse_index_v1_nodemap
                     elif use_rust_index:
                         self._parse_index = parse_index_v1_mixed
                     try:
                         d = self._parse_index(index_data, self._inline)
                         index, chunkcache = d
                         use_nodemap = (
                             not self._inline
                             and self._nodemap_file is not None
                             and hasattr(index, 'update_nodemap_data')
                         )
                         if use_nodemap:
                             nodemap_data = nodemaputil.persisted_data(self)
                             if nodemap_data is not None:
                                 docket = nodemap_data[0]
                                 # only use the persisted data when the index entry at
                                 # the docket's `tip_rev` carries the docket's `tip_node`
                                 if (
                                     len(d[0]) > docket.tip_rev
                                     and d[0][docket.tip_rev][7] == docket.tip_node
                                 ):
                                     # no changelog tampering
                                     self._nodemap_docket = docket
                                     index.update_nodemap_data(*nodemap_data)
                     except (ValueError, IndexError):
                         raise error.RevlogError(
                             _(b"index %s is corrupted") % self.display_id
                         )
                     self.index = index
                     # revision data is read from the index file for inline revlogs and
                     # from the data file otherwise
                     self._segmentfile = randomaccessfile.randomaccessfile(
                         self.opener,
                         (self._indexfile if self._inline else self._datafile),
                         self.data_config.chunk_cache_size,
                         chunkcache,
                     )
                     self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
                         self.opener,
                         self._sidedatafile,
                         self.data_config.chunk_cache_size,
                     )
                     # revnum -> (chain-length, sum-delta-length)
                     self._chaininfocache = util.lrucachedict(500)
                     # revlog header -> revlog compressor
                     self._decompressors = {}
                 def get_revlog(self):
                     """Return this object itself

                     Simple function mirroring the API of other, not-really-revlog,
                     objects.
                     """
                     return self
                 @util.propertycache
                 def revlog_kind(self):
                     """The first item of `self.target` (the KIND of the revlog)"""
                     target = self.target
                     return target[0]
                 @util.propertycache
                 def display_id(self):
                     """The public facing "ID" of the revlog that we use in messages

                     For a filelog this is the second item of `self.target`, for any
                     other kind of revlog this is the radix.
                     """
                     if self.revlog_kind != KIND_FILELOG:
                         return self.radix
                     # Reference the file without the "data/" prefix, so it is familiar
                     # to the user.
                     return self.target[1]
                 def _get_decompressor(self, t):
                     try:
                         compressor = self._decompressors[t]
                     except KeyError:
                         try:
                             engine = util.compengines.forrevlogheader(t)
                             compressor = engine.revlogcompressor(
                                 self.feature_config.compression_engine_options
                             )
                             self._decompressors[t] = compressor
                         except KeyError:
                             raise error.RevlogError(
                                 _(b'unknown compression type %s') % binascii.hexlify(t)
                             )
                     return compressor
                 @util.propertycache
                 def _compressor(self):
                     """Compressor built from the configured compression engine"""
                     config = self.feature_config
                     engine = util.compengines[config.compression_engine]
                     return engine.revlogcompressor(config.compression_engine_options)
                 @util.propertycache
                 def _decompressor(self):
                     """Default decompress callable, or None when there is no docket.

                     The callable is the ``decompress`` method of the compressor
                     matching the docket's default compression header.
                     """
                     docket = self._docket
                     if docket is None:
                         return None
                     header = docket.default_compression_header
                     return self._get_decompressor(header).decompress
                 def _indexfp(self):
                     """Open the revlog's index file for reading and return it."""
                     index_path = self._indexfile
                     return self.opener(index_path, mode=b"r")
                 def __index_write_fp(self):
                     """Open the index file for writing, positioned where data ends.

                     Not meant to be called directly: go through `_writing` instead.
                     Without a docket the position is the end of the file, otherwise
                     it is the docket's ``index_end``. A missing file is created.
                     """
                     check_ambig = self.data_config.check_ambig
                     try:
                         fp = self.opener(
                             self._indexfile, mode=b"r+", checkambig=check_ambig
                         )
                         docket = self._docket
                         if docket is not None:
                             fp.seek(docket.index_end, os.SEEK_SET)
                         else:
                             fp.seek(0, os.SEEK_END)
                         return fp
                     except FileNotFoundError:
                         # No index yet: start a fresh one.
                         return self.opener(
                             self._indexfile, mode=b"w+", checkambig=check_ambig
                         )
                 def __index_new_fp(self):
                     """Open a brand new index file through an atomic temporary file.

                     Only intended for the upgrade away from an inline revlog.
                     """
                     options = {
                         'mode': b"w",
                         'checkambig': self.data_config.check_ambig,
                         'atomictemp': True,
                     }
                     return self.opener(self._indexfile, **options)
                 def _datafp(self, mode=b'r'):
                     """Open the revlog's data file with ``mode`` and return it."""
                     data_path = self._datafile
                     return self.opener(data_path, mode=mode)
                 @contextlib.contextmanager
                 def _sidedatareadfp(self):
                     """Context manager yielding a file object to read sidedata from."""
                     handles = self._writinghandles
                     if not handles:
                         # Nothing open for writing: open the sidedata file just for
                         # the duration of the context.
                         with self.opener(self._sidedatafile) as fp:
                             yield fp
                     else:
                         # Reuse the third entry of the currently open write handles.
                         yield handles[2]
                 def tiprev(self):
                     """Return the highest revision number (-1 for an empty index)."""
                     count = len(self.index)
                     return count - 1
                 def tip(self):
                     """Return the node of the highest revision."""
                     last = self.tiprev()
                     return self.node(last)
                 def __contains__(self, rev):
                     """Tell whether ``rev`` lies within ``[0, len(self))``."""
                     if not 0 <= rev:
                         return False
                     return rev < len(self)
                 def __len__(self):
                     """Number of revisions, i.e. the number of index entries."""
                     index = self.index
                     return len(index)
                 def __iter__(self):
                     """Iterate over revision numbers from 0 to ``len(self) - 1``."""
                     count = len(self)
                     return iter(range(count))
                 def revs(self, start=0, stop=None):
                     """Iterate over the revisions of this revlog from start to stop.

                     The iteration itself is delegated to ``storageutil.iterrevs``.
                     """
                     total = len(self)
                     return storageutil.iterrevs(total, start=start, stop=stop)
                 def hasnode(self, node):
                     """Tell whether ``node`` resolves to a revision of this revlog."""
                     try:
                         self.rev(node)
                     except KeyError:
                         return False
                     else:
                         return True
                 def _candelta(self, baserev, rev):
                     """Tell whether a delta between ``baserev`` and ``rev`` is allowed.

                     A delta is refused as soon as one of the two revisions carries a
                     flag whose processor changes the rawtext (LFS for instance). Such a
                     processor can alter the content the delta is based on, and two
                     clients may hold the same node with different flags, hence with
                     different rawtexts, which would make the delta incompatible.
                     """
                     for candidate in (baserev, rev):
                         if self.flags(candidate) & REVIDX_RAWTEXT_CHANGING_FLAGS:
                             return False
                     return True
                 def update_caches(self, transaction):
                     """Update the on-disk caches (the persistent nodemap, if any).

                     With a transaction, the nodemap update is registered on it and may
                     be delayed until commit; without one it is performed right away.
                     """
                     if self._nodemap_file is None:
                         return
                     if transaction is not None:
                         nodemaputil.setup_persistent_nodemap(transaction, self)
                     else:
                         nodemaputil.update_persistent_nodemap(self)
                 def clearcaches(self):
                     """Drop the in-memory caches, then reload persistent nodemap data."""
                     self._revisioncache = None
                     self._chainbasecache.clear()
                     self._segmentfile.clear_cache()
                     self._segmentfile_sidedata.clear_cache()
                     self._pcache = {}
                     self._nodemap_docket = None
                     self.index.clearcaches()
                     # Validating the docket is the job of the python code, so the
                     # nodemap data has to be refreshed from here.
                     if self._inline or self._nodemap_file is None:
                         return
                     if not hasattr(self.index, 'update_nodemap_data'):
                         return
                     persisted = nodemaputil.persisted_data(self)
                     if persisted is None:
                         return
                     self._nodemap_docket = persisted[0]
                     self.index.update_nodemap_data(*persisted)
                 def rev(self, node):
                     """Return the revision number associated with a <nodeid>.

                     Raises ``error.WdirUnsupported`` for the working directory
                     pseudo-nodes and ``error.LookupError`` for any other unknown node.
                     """
                     try:
                         return self.index.rev(node)
                     except TypeError:
                         raise
                     except error.RevlogError:
                         # The index lookup (radix tree in parsers.c) failed.
                         constants = self.nodeconstants
                         is_wdir = (
                             node == constants.wdirid
                             or node in constants.wdirfilenodeids
                         )
                         if is_wdir:
                             raise error.WdirUnsupported
                         raise error.LookupError(node, self.display_id, _(b'no node'))
                 # Accessors for index entries.
                 # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
                 # are flags.
                 def start(self, rev):
                     """Return the offset of ``rev``'s data.

                     The first index field packs the offset above 16 bits of flags;
                     the flags are shifted out here.
                     """
                     offset_flags = self.index[rev][0]
                     return int(offset_flags >> 16)
                 def sidedata_cut_off(self, rev):
                     """Return the sidedata offset to use for ``rev``.

                     A non-zero recorded offset is returned as is. Otherwise the result
                     is the end (offset + length) of the closest revision at or below
                     ``rev`` that has sidedata, or 0 when there is none.
                     """
                     index = self.index
                     recorded = index[rev][8]
                     if recorded != 0:
                         return recorded
                     # Entries without sidedata currently record 0 as their offset
                     # (instead of previous-offset + previous-size), so walk backward
                     # to find where the sidedata written so far actually ends.
                     #
                     # This "no sidedata -> offset 0" policy should be reconsidered;
                     # until then this dance is needed.
                     for candidate in range(rev, -1, -1):
                         entry = index[candidate]
                         if entry[9] != 0:
                             return entry[8] + entry[9]
                     return 0
                 def flags(self, rev):
                     """Return the flags of ``rev``: low 16 bits of the first index field."""
                     offset_flags = self.index[rev][0]
                     return offset_flags & 0xFFFF
                 def length(self, rev):
                     """Return the stored length of ``rev`` (second index field)."""
                     entry = self.index[rev]
                     return entry[1]
                 def sidedata_length(self, rev):
                     """Return the sidedata length of ``rev``, 0 if sidedata is disabled."""
                     if self.feature_config.has_side_data:
                         return self.index[rev][9]
                     return 0
                 def rawsize(self, rev):
                     """Return the length of the uncompressed text of a revision."""
                     recorded = self.index[rev][2]
                     if recorded < 0:
                         # No size recorded in the index: measure the raw data.
                         return len(self.rawdata(rev))
                     return recorded
                 def size(self, rev):
                     """Length of the non-raw text (after "read" flag processors)."""
                     revflags = self.flags(rev)
                     # Every known flag but ELLIPSIS, which is known to leave the
                     # content untouched, may change the content when read.
                     content_changing = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
                     if revflags & content_changing:
                         return len(self.revision(rev))
                     # Fast path: no processor can alter the text, size is rawsize.
                     return self.rawsize(rev)
                 def fast_rank(self, rev):
                     """Return the rank of a revision if already known, None otherwise.

                     The rank of a revision ``r`` is the size of the sub-graph it
                     defines as a head, that is the size of ``ancestors(r)`` with ``r``
                     included.

                     Only the value persisted in the index is consulted, in constant
                     time; nothing is computed for revlog versions that do not store
                     ranks.
                     """
                     stored = self.index[rev][ENTRY_RANK]
                     known = (
                         self._format_version == CHANGELOGV2
                         and stored != RANK_UNKNOWN
                     )
                     if not known:
                         return None
                     # By convention the null revision has rank 0.
                     return 0 if rev == nullrev else stored
                 def chainbase(self, rev):
                     """Return the revision at the base of ``rev``'s delta chain.

                     Base pointers (fourth index field) are followed until an entry
                     points to itself; the answer is memoized.
                     """
                     cache = self._chainbasecache
                     cached = cache.get(rev)
                     if cached is not None:
                         return cached
                     index = self.index
                     current = rev
                     while True:
                         base = index[current][3]
                         if base == current:
                             break
                         current = base
                     cache[rev] = base
                     return base
                 def linkrev(self, rev):
                     """Return the linkrev of ``rev`` (fifth index field)."""
                     entry = self.index[rev]
                     return entry[4]
                 def parentrevs(self, rev):
                     """Return the revision numbers of the two parents of ``rev``.

                     With ``canonical_parent_order`` set, a null first parent is moved
                     to the second position. Raises ``error.WdirUnsupported`` when
                     ``rev`` is the working directory revision.
                     """
                     try:
                         entry = self.index[rev]
                     except IndexError:
                         if rev != wdirrev:
                             raise
                         raise error.WdirUnsupported
                     p1, p2 = entry[5], entry[6]
                     if self.canonical_parent_order and p1 == nullrev:
                         return p2, p1
                     return p1, p2
                 # Fast parentrevs(rev) for callers whose rev is known not to be
                 # filtered. Here it is a plain alias of parentrevs().
                 # NOTE(review): presumably subclasses that filter revisions override
                 # parentrevs() and rely on this unchecked name -- confirm.
                 _uncheckedparentrevs = parentrevs
                 def node(self, rev):
                     """Return the node id of ``rev`` (eighth index field).

                     Raises ``error.WdirUnsupported`` when ``rev`` is the working
                     directory revision; other ``IndexError`` are propagated.
                     """
                     try:
                         nodeid = self.index[rev][7]
                     except IndexError:
                         if rev != wdirrev:
                             raise
                         raise error.WdirUnsupported
                     return nodeid
                 # Derived from index values.
                 def end(self, rev):
                     """Return the offset just past ``rev``'s data (start + length)."""
                     begin = self.start(rev)
                     return begin + self.length(rev)
                 def parents(self, node):
                     """Return the node ids of the two parents of ``node``.

                     The result is a ``(p1, p2)`` tuple of node ids. When
                     ``canonical_parent_order`` is set and the first parent is null,
                     the two parents are swapped so the null parent comes last, like
                     ``parentrevs()`` does for revision numbers.

                     Errors raised by ``self.rev(node)`` for an unknown node are
                     propagated.
                     """
                     index = self.index
                     entry = index[self.rev(node)]
                     p1, p2 = entry[5], entry[6]
                     # Index entries store the parents as revision numbers, so a null
                     # parent has to be detected with nullrev. Comparing against the
                     # null node id can never match and would disable the swap.
                     if self.canonical_parent_order and p1 == nullrev:
                         p1, p2 = p2, p1
                     # Read the node field directly instead of calling node(), to
                     # avoid the function call overhead.
                     return index[p1][7], index[p2][7]
                 def chainlen(self, rev):
                     """Return the length of ``rev``'s delta chain."""
                     info = self._chaininfo(rev)
                     return info[0]
                 def _chaininfo(self, rev):
                     """Return ``(chain length, summed stored length)`` for ``rev``.

                     The delta chain is walked toward its base, adding one link and
                     the stored length of each delta on the way. The walk stops early
                     on a revision whose result is already cached. Results are
                     memoized in ``self._chaininfocache``.
                     """
                     cache = self._chaininfocache
                     if rev in cache:
                         return cache[rev]
                     index = self.index
                     generaldelta = self.delta_config.general_delta
                     current = rev
                     entry = index[current]
                     links = 0
                     total = 0
                     reused_cache = False
                     while current != entry[3]:
                         links += 1
                         total += entry[1]
                         current = entry[3] if generaldelta else current - 1
                         if current in cache:
                             known = cache[current]
                             links += known[0]
                             total += known[1]
                             reused_cache = True
                             break
                         entry = index[current]
                     if not reused_cache:
                         # Count the text length of the base too, since decompressing
                         # it also takes work. A cache hit already includes it.
                         total += entry[1]
                     result = (links, total)
                     cache[rev] = result
                     return result
                 def _deltachain(self, rev, stoprev=None):
                     """Obtain the delta chain for a revision.

                     ``stoprev`` is a revision to stop at; when it is not given the
                     walk goes down to the base of the chain.

                     Returns a ``(chain, stopped)`` pair: ``chain`` lists the revisions
                     in ascending order and ``stopped`` tells whether ``stoprev`` was
                     reached.
                     """
                     generaldelta = self.delta_config.general_delta
                     index = self.index
                     # Use the index's own implementation (C) when it offers one.
                     try:
                         return index.deltachain(rev, stoprev, generaldelta)
                     except AttributeError:
                         pass
                     collected = []
                     current = rev
                     entry = index[current]
                     while not (current == entry[3] or current == stoprev):
                         collected.append(current)
                         current = entry[3] if generaldelta else current - 1
                         entry = index[current]
                     stopped = current == stoprev
                     if not stopped:
                         # The chain base is part of the chain, stoprev is not.
                         collected.append(current)
                     collected.reverse()
                     return collected, stopped
                 def ancestors(self, revs, stoprev=0, inclusive=False):
                     """Generate the ancestors of 'revs' in reverse revision order.

                     Revisions lower than stoprev are not generated. See the
                     documentation of ancestor.lazyancestors for more details.
                     """
                     revs = list(revs)
                     # Make sure the start revisions are not filtered: node() raises
                     # on them.
                     for start in revs:
                         self.node(start)
                     # Ancestors are then known not to be filtered either, so the
                     # unchecked accessors can be used.
                     use_rust = rustancestor is not None and self.index.rust_ext_compat
                     if use_rust:
                         factory, source = rustancestor.LazyAncestors, self.index
                     else:
                         factory = ancestor.lazyancestors
                         source = self._uncheckedparentrevs
                     return factory(source, revs, stoprev=stoprev, inclusive=inclusive)
                 def descendants(self, revs):
                     """Return the descendants of ``revs`` via ``dagop.descendantrevs``."""
                     iter_revs = self.revs
                     parents_of = self.parentrevs
                     return dagop.descendantrevs(revs, iter_revs, parents_of)
                 def findcommonmissing(self, common=None, heads=None):
                     """Return ``(::common, (::heads) - (::common))``.

                     The first item is a set-like object holding the ancestors of
                     ``common`` as revision numbers (``common`` and the null revision
                     included). The second item is the list of nodes that are
                     ancestors of ``heads`` without being ancestors of ``common``,
                     sorted by revision number and therefore topologically.

                     'heads' and 'common' are both lists of node IDs. Without 'heads',
                     all the heads of the revlog are used; without 'common', nullid is
                     used.
                     """
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()
                     commonrevs = [self.rev(n) for n in common]
                     headrevs = [self.rev(n) for n in heads]

                     class lazyset:
                         """Explicitly added values on top of a lazy collection."""

                         def __init__(self, lazyvalues):
                             self.addedvalues = set()
                             self.lazyvalues = lazyvalues

                         def __contains__(self, value):
                             if value in self.addedvalues:
                                 return True
                             return value in self.lazyvalues

                         def __iter__(self):
                             explicit = self.addedvalues
                             yield from explicit
                             for value in self.lazyvalues:
                                 if value not in explicit:
                                     yield value

                         def add(self, value):
                             self.addedvalues.add(value)

                         def update(self, values):
                             self.addedvalues.update(values)

                     # The ancestors are wanted inclusive of common itself.
                     has = lazyset(self.ancestors(commonrevs))
                     has.add(nullrev)
                     has.update(commonrevs)

                     # Walk from the heads and collect every ancestor not in 'has'.
                     missing = set()
                     pending = collections.deque(r for r in headrevs if r not in has)
                     while pending:
                         current = pending.popleft()
                         if current in missing:
                             continue
                         missing.add(current)
                         pending.extend(
                             p for p in self.parentrevs(current) if p not in has
                         )
                     return has, [self.node(r) for r in sorted(missing)]
                 def incrementalmissingrevs(self, common=None):
                     """Return an object computing missing ancestors incrementally.

                     The object computes the revision numbers of the ancestors of
                     arbitrary sets that are not ancestors of ``common``. It is an
                     ancestor.incrementalmissingancestors object, or its Rust
                     counterpart when available and compatible with the index.

                     'common' is a list of revision numbers, nullrev when not given.
                     """
                     if common is None:
                         common = [nullrev]
                     rust_usable = (
                         rustancestor is not None and self.index.rust_ext_compat
                     )
                     if not rust_usable:
                         return ancestor.incrementalmissingancestors(
                             self.parentrevs, common
                         )
                     return rustancestor.MissingAncestors(self.index, common)
                 def findmissingrevs(self, common=None, heads=None):
                     """Return the revisions that are ancestors of heads but not of common.

                     More precisely, the result lists the revision numbers of the
                     nodes N such that:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of revision numbers. Without
                     'heads', all the heads of the revlog are used; without 'common',
                     nullrev is used.
                     """
                     bases = [nullrev] if common is None else common
                     tips = self.headrevs() if heads is None else heads
                     tracker = self.incrementalmissingrevs(common=bases)
                     return tracker.missingancestors(tips)
                 def findmissing(self, common=None, heads=None):
                     """Return the nodes that are ancestors of heads but not of common.

                     More precisely, the result lists the nodes N such that:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The list is sorted by revision number, meaning it is
                     topologically sorted.

                     'heads' and 'common' are both lists of node IDs. Without 'heads',
                     all the heads of the revlog are used; without 'common', nullid is
                     used.
                     """
                     if common is None:
                         common = [self.nullid]
                     if heads is None:
                         heads = self.heads()
                     commonrevs = [self.rev(n) for n in common]
                     headrevs = [self.rev(n) for n in heads]
                     tracker = self.incrementalmissingrevs(common=commonrevs)
                     missingrevs = tracker.missingancestors(headrevs)
                     return [self.node(r) for r in missingrevs]
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a topological path from 'roots' to 'heads'.

                     Return a tuple (nodes, outroots, outheads) where 'nodes' is a
                     topologically sorted list of all nodes N that satisfy both of
                     these constraints:

                       1. N is a descendant of some node in 'roots'
                       2. N is an ancestor of some node in 'heads'

                     Every node is considered to be both a descendant and an ancestor
                     of itself, so every reachable node in 'roots' and 'heads' will be
                     included in 'nodes'.

                     'outroots' is the list of reachable nodes in 'roots', i.e., the
                     subset of 'roots' that is returned in 'nodes'.  Likewise,
                     'outheads' is the subset of 'heads' that is also in 'nodes'.

                     'roots' and 'heads' are both lists of node IDs.  If 'roots' is
                     unspecified, uses nullid as the only root.  If 'heads' is
                     unspecified, uses list of all of the revlog's heads.

                     When 'roots' or 'heads' is given but empty, or when nothing
                     connects them, three empty lists are returned."""
                     # Result used whenever there is nothing to report.
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [self.nullid]  # Everybody's a descendant of nullid
                         lowestrev = nullrev
                     if (lowestrev == nullrev) and (heads is None):
                         # We want _all_ the nodes!
                         return (
                             [self.node(r) for r in self],
                             [self.nullid],
                             list(self.heads()),
                         )
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = len(self) - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = set()
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, False)
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = set(heads)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == self.nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendant of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors.add(n)  # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.update(
                                         [p for p in self.parents(n) if p != self.nullid]
                                     )
                                 elif n in heads:  # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > nullrev:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [root for root in roots if root in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(root) for root in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = nullrev
                             roots = [self.nullid]
                     # Transform our roots list into a set.
                     descendants = set(roots)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendants.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descendants, empty parents will look like
                     # they're descendants.
                     for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
                         n = self.node(r)
                         isdescendant = False
                         if lowestrev == nullrev:  # Everybody is a descendant of nullid
                             isdescendant = True
                         elif n in descendants:
                             # n is already a descendant
                             isdescendant = True
                             # This check only needs to be done here because all the roots
                             # will start being marked as descendants before the loop.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendants, it's not a root.
                                 if (p[0] in descendants) or (p[1] in descendants):
                                     roots.remove(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendant if either of its parents are
                             # descendants.  (We seeded the descendants set with the
                             # roots up there, remember?)
                             if (p[0] in descendants) or (p[1] in descendants):
                                 descendants.add(n)
                                 isdescendant = True
                         if isdescendant and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendants and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = True
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = True
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     # Keep only the heads that were actually reached (or discovered).
                     heads = [head for head, flag in heads.items() if flag]
                     roots = list(roots)
                     # Sanity checks: every result collection is expected to be
                     # non-empty once this point is reached.
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def headrevs(self, revs=None):
                     """Return the head revisions, of the whole revlog or within ``revs``.

                     Without ``revs`` the index's own ``headrevs()`` is used when it
                     has one, the pure Python ``_headrevs()`` otherwise. With ``revs``
                     the heads are computed by the Rust or Python dagop helpers.
                     """
                     if revs is not None:
                         if rustdagop is not None and self.index.rust_ext_compat:
                             return rustdagop.headrevs(self.index, revs)
                         return dagop.headrevs(revs, self._uncheckedparentrevs)
                     try:
                         return self.index.headrevs()
                     except AttributeError:
                         return self._headrevs()
                 def computephases(self, roots):
                     """Hand ``roots`` to the index's ``computephasesmapsets`` and
                     return its result unchanged."""
                     index = self.index
                     return index.computephasesmapsets(roots)
                 def _headrevs(self):
                     count = len(self)
                     if not count:
                         return [nullrev]
                     # we won't iter over filtered rev so nobody is a head at start
                     ishead = [0] * (count + 1)
                     index = self.index
                     for r in self:
                         ishead[r] = 1  # I may be an head
                         e = index[r]
                         ishead[e[5]] = ishead[e[6]] = 0  # my parent are not
                     return [r for r, val in enumerate(ishead) if val]
                 def heads(self, start=None, stop=None):
                     """Return the list of nodes that have no children.
                     start: when given, only heads that descend from this node are
                     returned.
                     stop: when given, the revisions of these nodes are treated as if
                     they had no children.
                     With neither argument, an empty revlog yields ``[self.nullid]``.
                     """
                     if start is not None or stop is not None:
                         startrev = nullrev if start is None else self.rev(start)
                         stoprevs = set()
                         for stopnode in stop or []:
                             stoprevs.add(self.rev(stopnode))
                         subset = dagop.headrevssubset(
                             self.revs,
                             self.parentrevs,
                             startrev=startrev,
                             stoprevs=stoprevs,
                         )
                         return [self.node(rev) for rev in subset]
                     if len(self) == 0:
                         return [self.nullid]
                     return [self.node(rev) for rev in self.headrevs()]
                 def children(self, node):
                     """Return the nodes of the revisions that have ``node`` as parent.
                     Only revisions after ``node`` are scanned. A revision with no
                     non-null parent is reported only when ``node`` is the null
                     revision itself.
                     """
                     target = self.rev(node)
                     found = []
                     for rev in self.revs(start=target + 1):
                         realparents = [
                             pr for pr in self.parentrevs(rev) if pr != nullrev
                         ]
                         if not realparents:
                             if target == nullrev:
                                 found.append(self.node(rev))
                             continue
                         for pr in realparents:
                             if pr == target:
                                 found.append(self.node(rev))
                     return found
                 def commonancestorsheads(self, a, b):
                     """Return the nodes heading the common ancestors of nodes a and b."""
                     headrevs = self._commonancestorsheads(self.rev(a), self.rev(b))
                     return pycompat.maplist(self.node, headrevs)
                 def _commonancestorsheads(self, *revs):
                     """calculate all the heads of the common ancestors of revs"""
                     try:
                         ancs = self.index.commonancestorsheads(*revs)
                     except (AttributeError, OverflowError):  # C implementation failed
                         ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
                     return ancs
                 def isancestor(self, a, b):
                     """Tell whether node a is an ancestor of node b.
                     A revision counts as an ancestor of itself."""
                     reva = self.rev(a)
                     revb = self.rev(b)
                     return self.isancestorrev(reva, revb)
                 def isancestorrev(self, a, b):
                     """Tell whether revision a is an ancestor of revision b.
                     A revision counts as an ancestor of itself, and the null revision
                     is an ancestor of everything. The check itself is trivial; the
                     ``reachableroots`` machinery it relies on is not.
                     """
                     if a == nullrev or a == b:
                         return True
                     if a > b:
                         # an ancestor never has a higher revision number
                         return False
                     reached = self.reachableroots(a, [b], [a], includepath=False)
                     return bool(reached)
                 def reachableroots(self, minroot, heads, roots, includepath=False):
                     """Return (heads(::(<roots> and <roots>::<heads>))).
                     With ``includepath`` set, return (<roots>::<heads>) instead.
                     The index's ``reachableroots2`` is used when available; an
                     AttributeError falls back to the pure implementation in ``dagop``.
                     """
                     try:
                         reached = self.index.reachableroots2(
                             minroot, heads, roots, includepath
                         )
                     except AttributeError:
                         reached = dagop._reachablerootspure(
                             self.parentrevs, minroot, roots, heads, includepath
                         )
                     return reached
                 def ancestor(self, a, b):
                     """Return the "best" common ancestor of nodes a and b.
                     When several candidates tie, the smallest node is picked so the
                     answer is stable. ``self.nullid`` is returned when there is no
                     candidate at all.
                     """
                     reva, revb = self.rev(a), self.rev(b)
                     try:
                         candidates = self.index.ancestors(reva, revb)
                     except (AttributeError, OverflowError):
                         candidates = ancestor.ancestors(self.parentrevs, reva, revb)
                     if not candidates:
                         return self.nullid
                     # choose a consistent winner when there's a tie
                     return min(self.node(rev) for rev in candidates)
                 def _match(self, id):
                     if isinstance(id, int):
                         # rev
                         return self.node(id)
                     if len(id) == self.nodeconstants.nodelen:
                         # possibly a binary node
                         # odds of a binary node being all hex in ASCII are 1 in 10**25
                         try:
                             node = id
                             self.rev(node)  # quick search the index
                             return node
                         except error.LookupError:
                             pass  # may be partial hex id
                     try:
                         # str(rev)
                         rev = int(id)
                         if b"%d" % rev != id:
                             raise ValueError
                         if rev < 0:
                             rev = len(self) + rev
                         if rev < 0 or rev >= len(self):
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         pass
                     if len(id) == 2 * self.nodeconstants.nodelen:
                         try:
                             # a full hex nodeid?
                             node = bin(id)
                             self.rev(node)
                             return node
                         except (binascii.Error, error.LookupError):
                             pass
                 def _partialmatch(self, id):
                     """Resolve the hex prefix ``id`` to a single node.
                     The index's ``partialmatch`` is tried first. When it is missing,
                     rejects the key, or reports several matches while revisions are
                     filtered, every index entry is scanned instead.
                     Returns the matching node, or None when nothing matches (this
                     includes falling off the end for a prefix longer than 40
                     characters or one that is not valid hex).
                     Raises ``error.AmbiguousPrefixLookupError`` when the prefix matches
                     several nodes, or one node and also the working-directory id, and
                     ``error.WdirUnsupported`` when it matches the working-directory id
                     only.
                     """
                     # we don't care wdirfilenodeids as they should be always full hash
                     # True when ``id`` is also a prefix of the working-directory hex id
                     maybewdir = self.nodeconstants.wdirhex.startswith(id)
                     ambiguous = False
                     try:
                         partial = self.index.partialmatch(id)
                         if partial and self.hasnode(partial):
                             if maybewdir:
                                 # single 'ff...' match in radix tree, ambiguous with wdir
                                 ambiguous = True
                             else:
                                 return partial
                         elif maybewdir:
                             # no 'ff...' match in radix tree, wdir identified
                             raise error.WdirUnsupported
                         else:
                             return None
                     except error.RevlogError:
                         # parsers.c radix tree lookup gave multiple matches
                         # fast path: for unfiltered changelog, radix tree is accurate
                         if not getattr(self, 'filteredrevs', None):
                             ambiguous = True
                         # fall through to slow path that filters hidden revisions
                     except (AttributeError, ValueError):
                         # we are pure python, or key is not hex
                         pass
                     if ambiguous:
                         raise error.AmbiguousPrefixLookupError(
                             id, self.display_id, _(b'ambiguous identifier')
                         )
                     # unique results of earlier slow-path scans are kept in _pcache
                     if id in self._pcache:
                         return self._pcache[id]
                     # NOTE(review): 40 is hard-coded; presumably the hex length of a
                     # SHA-1 node -- confirm whether it should follow
                     # self.nodeconstants.nodelen.
                     if len(id) <= 40:
                         # hex(node)[:...]
                         l = len(id) // 2 * 2  # grab an even number of digits
                         try:
                             # we're dropping the last digit, so let's check that it's hex,
                             # to avoid the expensive computation below if it's not
                             if len(id) % 2 > 0:
                                 if not (id[-1] in hexdigits):
                                     return None
                             prefix = bin(id[:l])
                         except binascii.Error:
                             pass
                         else:
                             # first pass: binary comparison on the even-length prefix
                             nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                             # second pass: compare the full (possibly odd-length) hex
                             # prefix and drop nodes that hasnode() does not report
                             nl = [
                                 n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                             ]
                             if self.nodeconstants.nullhex.startswith(id):
                                 nl.append(self.nullid)
                             if len(nl) > 0:
                                 if len(nl) == 1 and not maybewdir:
                                     self._pcache[id] = nl[0]
                                     return nl[0]
                                 raise error.AmbiguousPrefixLookupError(
                                     id, self.display_id, _(b'ambiguous identifier')
                                 )
                             if maybewdir:
                                 raise error.WdirUnsupported
                             return None
                 def lookup(self, id):
                     """Locate a node from:
                     - a revision number or str(revision number)
                     - a nodeid or a prefix of a hex nodeid
                     Raises ``error.LookupError`` when nothing matches.
                     """
                     exact = self._match(id)
                     if exact is None:
                         partial = self._partialmatch(id)
                         if not partial:
                             raise error.LookupError(
                                 id, self.display_id, _(b'no match found')
                             )
                         return partial
                     return exact
                 def shortest(self, node, minlength=1):
                     """Find the shortest unambiguous prefix that matches node.
                     The returned prefix is a prefix of ``hex(node)`` at least
                     ``minlength`` characters long. For nodes other than the
                     working-directory id it is lengthened until it is no longer made
                     of 'f' characters only.
                     Raises ``error.LookupError`` when the node cannot be found.
                     """
                     # True when ``prefix`` resolves without ambiguity (or only hits the
                     # working-directory id), False when it is ambiguous; raises
                     # LookupError when it matches nothing at all.
                     def isvalid(prefix):
                         try:
                             matchednode = self._partialmatch(prefix)
                         except error.AmbiguousPrefixLookupError:
                             return False
                         except error.WdirUnsupported:
                             # single 'ff...' match
                             return True
                         if matchednode is None:
                             raise error.LookupError(node, self.display_id, _(b'no node'))
                         return True
                     # A prefix consisting solely of 'f' could also designate wdir.
                     def maybewdir(prefix):
                         return all(c == b'f' for c in pycompat.iterbytestr(prefix))
                     hexnode = hex(node)
                     def disambiguate(hexnode, minlength):
                         """Disambiguate against wdirid."""
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if not maybewdir(prefix):
                                 return prefix
                     # Fast path: with no filtered revisions the index can compute the
                     # length itself.
                     if not getattr(self, 'filteredrevs', None):
                         try:
                             length = max(self.index.shortest(node), minlength)
                             return disambiguate(hexnode, length)
                         except error.RevlogError:
                             # only the working-directory id is allowed to be unknown to
                             # the index; it is handled further down
                             if node != self.nodeconstants.wdirid:
                                 raise error.LookupError(
                                     node, self.display_id, _(b'no node')
                                 )
                         except AttributeError:
                             # Fall through to pure code
                             pass
                     # The working-directory id is all 'f', so it is returned without
                     # going through disambiguate().
                     if node == self.nodeconstants.wdirid:
                         for length in range(minlength, len(hexnode) + 1):
                             prefix = hexnode[:length]
                             if isvalid(prefix):
                                 return prefix
                     # Slow path: grow the prefix until _partialmatch accepts it.
                     for length in range(minlength, len(hexnode) + 1):
                         prefix = hexnode[:length]
                         if isvalid(prefix):
                             return disambiguate(hexnode, length)
                 def cmp(self, node, text):
                     """Compare ``text`` with the stored revision ``node``.
                     The SHA-1 revision hash of ``text`` with the parents of ``node``
                     is recomputed; True is returned when it differs from ``node``,
                     i.e. when the text is different from what is stored.
                     """
                     parents = self.parents(node)
                     p1, p2 = parents
                     recomputed = storageutil.hashrevisionsha1(text, p1, p2)
                     return recomputed != node
                 def _getsegmentforrevs(self, startrev, endrev):
                     """Obtain a segment of raw data corresponding to a range of revisions.
                     Accepts the start and end revisions and an optional already-open
                     file handle to be used for reading. If the file handle is read, its
                     seek position will not be preserved.
                     Requests for data may be satisfied by a cache.
                     Returns a 2-tuple of (offset, data) for the requested range of
                     revisions. Offset is the integer offset from the beginning of the
                     revlog and data is a str or buffer of the raw byte data.
                     Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
                     to determine where each revision's data begins and ends.
                     """
                     # Inlined self.start(startrev) & self.end(endrev) for perf reasons
                     # (functions are expensive).
                     index = self.index
                     istart = index[startrev]
                     start = int(istart[0] >> 16)
                     if startrev == endrev:
                         end = start + istart[1]
                     else:
                         iend = index[endrev]
                         end = int(iend[0] >> 16) + iend[1]
                     if self._inline:
                         start += (startrev + 1) * self.index.entry_size
                         end += (endrev + 1) * self.index.entry_size
                     length = end - start
                     return start, self._segmentfile.read_chunk(start, length)
                 def _chunk(self, rev):
                     """Return the decompressed chunk stored for revision ``rev``.
                     The raw segment comes from ``_getsegmentforrevs`` and is decoded
                     according to the compression mode recorded in the index entry.
                     An unknown mode raises ``error.RevlogError``.
                     """
                     mode = self.index[rev][10]
                     raw = self._getsegmentforrevs(rev, rev)[1]
                     if mode == COMP_MODE_PLAIN:
                         # stored as is
                         return raw
                     if mode == COMP_MODE_DEFAULT:
                         return self._decompressor(raw)
                     if mode == COMP_MODE_INLINE:
                         return self.decompress(raw)
                     raise error.RevlogError(b'unknown compression mode %d' % mode)
                 def _chunks(self, revs, targetsize=None):
                     """Obtain decompressed chunks for the specified revisions.
                     Accepts an iterable of numeric revisions that are assumed to be in
                     ascending order. ``targetsize`` is forwarded to
                     ``deltautil.slicechunk`` when sparse reading is enabled.
                     This function is similar to calling ``self._chunk()`` multiple times,
                     but is faster.
                     Returns a list with decompressed data for each requested revision.
                     Raises ``error.RevlogError`` on an unknown compression mode.
                     """
                     if not revs:
                         return []
                     # bind everything used in the inner loop to local names
                     start = self.start
                     length = self.length
                     inline = self._inline
                     iosize = self.index.entry_size
                     buffer = util.buffer
                     l = []
                     ladd = l.append
                     if not self.data_config.with_sparse_read:
                         # a single read covering all requested revisions
                         slicedchunks = (revs,)
                     else:
                         slicedchunks = deltautil.slicechunk(
                             self, revs, targetsize=targetsize
                         )
                     for revschunk in slicedchunks:
                         firstrev = revschunk[0]
                         # Skip trailing revisions with empty diff
                         for lastrev in revschunk[::-1]:
                             if length(lastrev) != 0:
                                 break
                         try:
                             offset, data = self._getsegmentforrevs(firstrev, lastrev)
                         except OverflowError:
                             # issue4215 - we can't cache a run of chunks greater than
                             # 2G on Windows
                             # NOTE(review): this returns the chunks of the current slice
                             # only; results already collected in ``l`` from earlier
                             # slices look like they are dropped -- confirm.
                             return [self._chunk(rev) for rev in revschunk]
                         decomp = self.decompress
                         # self._decompressor might be None, but will not be used in that case
                         def_decomp = self._decompressor
                         for rev in revschunk:
                             chunkstart = start(rev)
                             if inline:
                                 # same per-entry shift as in _getsegmentforrevs
                                 chunkstart += (rev + 1) * iosize
                             chunklength = length(rev)
                             comp_mode = self.index[rev][10]
                             # slice this revision's bytes out of the shared segment
                             c = buffer(data, chunkstart - offset, chunklength)
                             if comp_mode == COMP_MODE_PLAIN:
                                 ladd(c)
                             elif comp_mode == COMP_MODE_INLINE:
                                 ladd(decomp(c))
                             elif comp_mode == COMP_MODE_DEFAULT:
                                 ladd(def_decomp(c))
                             else:
                                 msg = b'unknown compression mode %d'
                                 msg %= comp_mode
                                 raise error.RevlogError(msg)
                     return l
                 def deltaparent(self, rev):
                     """Return the revision that ``rev`` is stored as a delta against.
                     ``nullrev`` is returned when the entry is its own base. Otherwise
                     the recorded base is used with general delta, and the previous
                     revision without it.
                     """
                     base = self.index[rev][3]
                     if base == rev:
                         return nullrev
                     return base if self.delta_config.general_delta else rev - 1
                 def issnapshot(self, rev):
                     """tells whether rev is a snapshot
                     Without sparse-revlog, a revision is a snapshot exactly when it has
                     no delta parent. With sparse-revlog, the index's own ``issnapshot``
                     is used when it exists; otherwise the delta base is examined here:
                     a revision whose base is one of its parents is a plain delta, any
                     other revision is a snapshot if its base is one.
                     """
                     if not self.delta_config.sparse_revlog:
                         return self.deltaparent(rev) == nullrev
                     elif hasattr(self.index, 'issnapshot'):
                         # directly assign the method to cache the testing and access
                         # (later calls on this instance reach the index method
                         # without passing through this function)
                         self.issnapshot = self.index.issnapshot
                         return self.issnapshot(rev)
                     if rev == nullrev:
                         return True
                     entry = self.index[rev]
                     base = entry[3]
                     if base == rev:
                         return True
                     if base == nullrev:
                         return True
                     # Walk from each parent through delta parents for as long as the
                     # stored length is 0, so that the base is compared with the
                     # revision that actually holds data.
                     p1 = entry[5]
                     while self.length(p1) == 0:
                         b = self.deltaparent(p1)
                         if b == p1:
                             break
                         p1 = b
                     p2 = entry[6]
                     while self.length(p2) == 0:
                         b = self.deltaparent(p2)
                         if b == p2:
                             break
                         p2 = b
                     if base == p1 or base == p2:
                         # a delta against a parent is not a snapshot
                         return False
                     # a delta against something else is a snapshot only if that base
                     # is one as well
                     return self.issnapshot(base)
                 def snapshotdepth(self, rev):
                     """Return the number of snapshots in the chain before ``rev``.
                     ``rev`` must itself be a snapshot, otherwise
                     ``error.ProgrammingError`` is raised. The depth is the length of
                     the delta chain of ``rev`` minus one.
                     """
                     if not self.issnapshot(rev):
                         # interpolate the revision number: the message used to be
                         # emitted with a literal, unformatted '%d'
                         raise error.ProgrammingError(
                             b'revision %d not a snapshot' % rev
                         )
                     return len(self._deltachain(rev)[0]) - 1
                 def revdiff(self, rev1, rev2):
                     """Return a delta that turns revision rev1 into revision rev2.
                     The delta is in binary form and is meant to be written to revlog
                     data directly, so it is built from raw revision data. When rev2
                     is already stored as a delta against rev1, the stored chunk is
                     returned instead of computing a new diff.
                     """
                     stored = rev1 != nullrev and self.deltaparent(rev2) == rev1
                     if not stored:
                         return mdiff.textdiff(self.rawdata(rev1), self.rawdata(rev2))
                     return bytes(self._chunk(rev2))
                 def revision(self, nodeorrev):
                     """Return the uncompressed revision text for a node or a
                     revision number."""
                     text = self._revisiondata(nodeorrev)
                     return text
                 def sidedata(self, nodeorrev):
                     """Return the extra data attached to a revision that is not part
                     of its hash.
                     The result is currently a dictionary; a more advanced mapping
                     object will likely replace it in the future for a more
                     efficient/lazy code.
                     """
                     # accept either a revision number or a node
                     rev = nodeorrev if isinstance(nodeorrev, int) else self.rev(nodeorrev)
                     return self._sidedata(rev)
                 def _revisiondata(self, nodeorrev, raw=False):
                     """Return the text (or, with ``raw``, the raw text) of a revision.
                     nodeorrev: a revision number or a node.
                     raw: when true, return the text as stored, processed only through
                     ``flagutil.processflagsraw``; otherwise the flag processors of
                     ``flagutil.processflagsread`` produce the returned text.
                     The hash is verified through ``checkhash`` when the flag
                     processing asks for it, and a rawtext that did not come from the
                     revision cache is stored there before returning.
                     """
                     # deal with <nodeorrev> argument type
                     if isinstance(nodeorrev, int):
                         rev = nodeorrev
                         node = self.node(rev)
                     else:
                         node = nodeorrev
                         rev = None
                     # fast path the special `nullid` rev
                     if node == self.nullid:
                         return b""
                     # ``rawtext`` is the text as stored inside the revlog. Might be the
                     # revision or might need to be processed to retrieve the revision.
                     rev, rawtext, validated = self._rawtext(node, rev)
                     if raw and validated:
                         # if we don't want to process the raw text and that raw
                         # text is cached, we can exit early.
                         return rawtext
                     if rev is None:
                         # _rawtext hands back the rev it was given on a cache hit
                         rev = self.rev(node)
                     # the revlog's flag for this revision
                     # (usually alter its state or content)
                     flags = self.flags(rev)
                     if validated and flags == REVIDX_DEFAULT_FLAGS:
                         # no extra flags set, no flag processor runs, text = rawtext
                         return rawtext
                     if raw:
                         validatehash = flagutil.processflagsraw(self, rawtext, flags)
                         text = rawtext
                     else:
                         r = flagutil.processflagsread(self, rawtext, flags)
                         text, validatehash = r
                     if validatehash:
                         self.checkhash(text, node, rev=rev)
                     if not validated:
                         # freshly rebuilt rawtext: remember it for later calls
                         self._revisioncache = (node, rev, rawtext)
                     return text
                 def _rawtext(self, node, rev):
                     """return the possibly unvalidated rawtext for a revision
                     returns (rev, rawtext, validated)
                     ``validated`` is True only when the text comes straight from the
                     revision cache; in that case ``rev`` is returned as it was passed
                     in and may still be None. Otherwise the text is rebuilt from the
                     delta chain and the revision cache is cleared.
                     """
                     # revision in the cache (could be useful to apply delta)
                     cachedrev = None
                     # An intermediate text to apply deltas to
                     basetext = None
                     # Check if we have the entry in cache
                     # The cache entry looks like (node, rev, rawtext)
                     if self._revisioncache:
                         if self._revisioncache[0] == node:
                             return (rev, self._revisioncache[2], True)
                         cachedrev = self._revisioncache[1]
                     if rev is None:
                         rev = self.rev(node)
                     # ``stopped`` tells that the chain walk ended on the cached
                     # revision, whose text can then serve as the base
                     chain, stopped = self._deltachain(rev, stoprev=cachedrev)
                     if stopped:
                         basetext = self._revisioncache[2]
                     # drop cache to save memory, the caller is expected to
                     # update self._revisioncache after validating the text
                     self._revisioncache = None
                     targetsize = None
                     rawsize = self.index[rev][2]
                     if 0 <= rawsize:
                         # read-size hint handed to _chunks: four times the raw size
                         targetsize = 4 * rawsize
                     bins = self._chunks(chain, targetsize=targetsize)
                     if basetext is None:
                         # no cached base: the first chunk of the chain is the full
                         # text that the remaining deltas apply to
                         basetext = bytes(bins[0])
                         bins = bins[1:]
                     rawtext = mdiff.patches(basetext, bins)
                     del basetext  # let us have a chance to free memory early
                     return (rev, rawtext, False)
                 def _sidedata(self, rev):
                     """Return the sidedata for a given revision number."""
                     index_entry = self.index[rev]
                     sidedata_offset = index_entry[8]
                     sidedata_size = index_entry[9]
                     if self._inline:
                         sidedata_offset += self.index.entry_size * (1 + rev)
                     if sidedata_size == 0:
                         return {}
                     if self._docket.sidedata_end < sidedata_offset + sidedata_size:
                         filename = self._sidedatafile
                         end = self._docket.sidedata_end
                         offset = sidedata_offset
                         length = sidedata_size
                         m = FILE_TOO_SHORT_MSG % (filename, length, offset, end)
                         raise error.RevlogError(m)
                     comp_segment = self._segmentfile_sidedata.read_chunk(
                         sidedata_offset, sidedata_size
                     )
                     comp = self.index[rev][11]
                     if comp == COMP_MODE_PLAIN:
                         segment = comp_segment
                     elif comp == COMP_MODE_DEFAULT:
                         segment = self._decompressor(comp_segment)
                     elif comp == COMP_MODE_INLINE:
                         segment = self.decompress(comp_segment)
                     else:
                         msg = b'unknown compression mode %d'
                         msg %= comp
                         raise error.RevlogError(msg)
                     sidedata = sidedatautil.deserialize_sidedata(segment)
                     return sidedata
                 def rawdata(self, nodeorrev):
                     """Return the uncompressed raw data for a node or a revision
                     number."""
                     rawtext = self._revisiondata(nodeorrev, raw=True)
                     return rawtext
                 def hash(self, text, p1, p2):
                     """Compute the node hash of ``text`` with parents p1 and p2.
                     Kept as a method so that subclasses can substitute another hash.
                     """
                     digest = storageutil.hashrevisionsha1(text, p1, p2)
                     return digest
                 def checkhash(self, text, node, p1=None, p2=None, rev=None):
                     """Check node hash integrity.
                     Available as a function so that subclasses can extend hash mismatch
                     behaviors as needed.
                     text: the revision text to verify against ``node``.
                     p1, p2: the parents; looked up from ``node`` when both are None.
                     rev: only used to identify the revision in the error message.
                     Raises ``error.RevlogError`` on a mismatch, or
                     ``error.CensoredNodeError`` instead when the revlog is censorable
                     and ``text`` is censored text.
                     """
                     # Everything is wrapped in the try block so that a RevlogError
                     # from the lookups as well as the mismatch error raised below goes
                     # through the censorship check in the handler.
                     try:
                         if p1 is None and p2 is None:
                             p1, p2 = self.parents(node)
                         if node != self.hash(text, p1, p2):
                             # Clear the revision cache on hash failure. The revision cache
                             # only stores the raw revision and clearing the cache does have
                             # the side-effect that we won't have a cache hit when the raw
                             # revision data is accessed. But this case should be rare and
                             # it is extra work to teach the cache about the hash
                             # verification state.
                             if self._revisioncache and self._revisioncache[0] == node:
                                 self._revisioncache = None
                             # identify the revision by number when known, else by its
                             # short hex node
                             revornode = rev
                             if revornode is None:
                                 revornode = templatefilters.short(hex(node))
                             raise error.RevlogError(
                                 _(b"integrity check failed on %s:%s")
                                 % (self.display_id, pycompat.bytestr(revornode))
                             )
                     except error.RevlogError:
                         if self.feature_config.censorable and storageutil.iscensoredtext(
                             text
                         ):
                             raise error.CensoredNodeError(self.display_id, node, text)
                         raise
                 @property
                 def _split_index_file(self):
                     """the path where to expect the index of an ongoing splitting operation
                     The file will only exist if a splitting operation is in progress, but
                     it is always expected at the same location."""
                     parts = self.radix.split(b'/')
                     if len(parts) > 1:
                         # adds a '-s' prefix to the ``data/` or `meta/` base
                         head = parts[0] + b'-s'
                         mids = parts[1:-1]
                         tail = parts[-1] + b'.i'
                         pieces = [head] + mids + [tail]
                         return b'/'.join(pieces)
                     else:
                         # the revlog is stored at the root of the store (changelog or
                         # manifest), no risk of collision.
                         return self.radix + b'.i.s'
                 def _enforceinlinesize(self, tr, side_write=True):
                     """Check if the revlog is too big for inline and convert if so.
                     This should be called after revisions are added to the revlog. If the
                     revlog has grown too large to be an inline revlog, it will convert it
                     to use multiple index and data files.
                     ``tr`` is the transaction recording the conversion. The index file
                     must already be registered in it, otherwise a RevlogError is raised.
                     When ``side_write`` is true, the new index is written at the path
                     given by ``_split_index_file`` and only renamed over the real index
                     when the transaction is finalized.
                     """
                     tiprev = len(self) - 1
                     total_size = self.start(tiprev) + self.length(tiprev)
                     # nothing to do for a non-inline revlog or one still under the limit
                     if not self._inline or total_size < _maxinline:
                         return
                     troffset = tr.findoffset(self._indexfile)
                     if troffset is None:
                         raise error.RevlogError(
                             _(b"%s not found in the transaction") % self._indexfile
                         )
                     # a non-zero offset means the index had content when it was
                     # registered: request a backup of it from the transaction
                     if troffset:
                         tr.addbackup(self._indexfile, for_offset=True)
                     # register the (new) data file in the transaction at offset 0
                     tr.add(self._datafile, 0)
                     existing_handles = False
                     if self._writinghandles is not None:
                         existing_handles = True
                         fp = self._writinghandles[0]
                         fp.flush()
                         fp.close()
                         # We can't use the cached file handle after close(). So prevent
                         # its usage.
                         self._writinghandles = None
                         self._segmentfile.writing_handle = None
                         # No need to deal with sidedata writing handle as it is only
                         # relevant with revlog-v2 which is never inline, not reaching
                         # this code
                     if side_write:
                         old_index_file_path = self._indexfile
                         new_index_file_path = self._split_index_file
                         opener = self.opener
                         # the callbacks only hold a weak reference to this revlog
                         weak_self = weakref.ref(self)
                         # the "split" index replaces the real index when the
                         # transaction is finalized
                         def finalize_callback(tr):
                             opener.rename(
                                 new_index_file_path,
                                 old_index_file_path,
                                 checkambig=True,
                             )
                             maybe_self = weak_self()
                             if maybe_self is not None:
                                 maybe_self._indexfile = old_index_file_path
                         # on abort, only point the revlog back at its original index
                         def abort_callback(tr):
                             maybe_self = weak_self()
                             if maybe_self is not None:
                                 maybe_self._indexfile = old_index_file_path
                         tr.registertmp(new_index_file_path)
                         # build a callback identifier from ``self.target``
                         if self.target[1] is not None:
                             callback_id = b'000-revlog-split-%d-%s' % self.target
                         else:
                             callback_id = b'000-revlog-split-%d' % self.target[0]
                         tr.addfinalize(callback_id, finalize_callback)
                         tr.addabort(callback_id, abort_callback)
                     new_dfh = self._datafp(b'w+')
                     new_dfh.truncate(0)  # drop any potentially existing data
                     try:
                         # copy the data segment of every revision into the data file
                         with self.reading():
                             for r in self:
                                 new_dfh.write(self._getsegmentforrevs(r, r)[1])
                             new_dfh.flush()
                         if side_write:
                             self._indexfile = new_index_file_path
                         # rewrite the whole index without the inline flag
                         with self.__index_new_fp() as fp:
                             self._format_flags &= ~FLAG_INLINE_DATA
                             self._inline = False
                             for i in self:
                                 e = self.index.entry_binary(i)
                                 # without a docket, the first entry is prefixed by
                                 # the packed format header
                                 if i == 0 and self._docket is None:
                                     header = self._format_flags | self._format_version
                                     header = self.index.pack_header(header)
                                     e = header + e
                                 fp.write(e)
                             if self._docket is not None:
                                 self._docket.index_end = fp.tell()
                             # If we don't use side-write, the temp file replace the real
                             # index when we exit the context manager
                         nodemaputil.setup_persistent_nodemap(tr, self)
                         # data is now read from the separate data file
                         self._segmentfile = randomaccessfile.randomaccessfile(
                             self.opener,
                             self._datafile,
                             self.data_config.chunk_cache_size,
                         )
                         if existing_handles:
                             # switched from inline to conventional reopen the index
                             ifh = self.__index_write_fp()
                             self._writinghandles = (ifh, new_dfh, None)
                             self._segmentfile.writing_handle = new_dfh
                             # the handle is now owned by ``_writinghandles``; make
                             # sure the ``finally`` clause below does not close it
                             new_dfh = None
                             # No need to deal with sidedata writing handle as it is only
                             # relevant with revlog-v2 which is never inline, not reaching
                             # this code
                     finally:
                         if new_dfh is not None:
                             new_dfh.close()
                 def _nodeduplicatecallback(self, transaction, node):
                     """called when trying to add a node already stored."""
                 @contextlib.contextmanager
                 def reading(self):
                     """Keep the data and sidedata files open for reading while active."""
                     if len(self.index) == 0:
                         # nothing to be read
                         yield
                         return
                     # data file is entered first and therefore released last
                     with self._segmentfile.reading(), self._segmentfile_sidedata.reading():
                         yield
                 @contextlib.contextmanager
                 def _writing(self, transaction):
                     if self._trypending:
                         msg = b'try to write in a `trypending` revlog: %s'
                         msg %= self.display_id
                         raise error.ProgrammingError(msg)
                     if self._writinghandles is not None:
                         yield
                     else:
                         ifh = dfh = sdfh = None
                         try:
                             r = len(self)
                             # opening the data file.
                             dsize = 0
                             if r:
                                 dsize = self.end(r - 1)
                             dfh = None
                             if not self._inline:
                                 try:
                                     dfh = self._datafp(b"r+")
                                     if self._docket is None:
                                         dfh.seek(0, os.SEEK_END)
                                     else:
                                         dfh.seek(self._docket.data_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     dfh = self._datafp(b"w+")
                                 transaction.add(self._datafile, dsize)
                             if self._sidedatafile is not None:
                                 # revlog-v2 does not inline, help Pytype
                                 assert dfh is not None
                                 try:
                                     sdfh = self.opener(self._sidedatafile, mode=b"r+")
                                     dfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                                 except FileNotFoundError:
                                     sdfh = self.opener(self._sidedatafile, mode=b"w+")
                                 transaction.add(
                                     self._sidedatafile, self._docket.sidedata_end
                                 )
                             # opening the index file.
                             isize = r * self.index.entry_size
                             ifh = self.__index_write_fp()
                             if self._inline:
                                 transaction.add(self._indexfile, dsize + isize)
                             else:
                                 transaction.add(self._indexfile, isize)
                             # exposing all file handle for writing.
                             self._writinghandles = (ifh, dfh, sdfh)
                             self._segmentfile.writing_handle = ifh if self._inline else dfh
                             self._segmentfile_sidedata.writing_handle = sdfh
                             yield
                             if self._docket is not None:
                                 self._write_docket(transaction)
                         finally:
                             self._writinghandles = None
                             self._segmentfile.writing_handle = None
                             self._segmentfile_sidedata.writing_handle = None
                             if dfh is not None:
                                 dfh.close()
                             if sdfh is not None:
                                 sdfh.close()
                             # closing the index file last to avoid exposing referent to
                             # potential unflushed data content.
                             if ifh is not None:
                                 ifh.close()
                 def _write_docket(self, transaction):
                     """write the current docket on disk
                     Exist as a method to help changelog to implement transaction logic
                     We could also imagine using the same transaction logic for all revlog
                     since docket are cheap."""
                     self._docket.write(transaction)
                 def addrevision(
                     self,
                     text,
                     transaction,
                     link,
                     p1,
                     p2,
                     cachedelta=None,
                     node=None,
                     flags=REVIDX_DEFAULT_FLAGS,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a revision to the log and return its revision number.
                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     cachedelta - an optional precomputed delta
                     node - nodeid of revision; typically node is not specified, and it is
                         computed by default as hash(text, p1, p2), however subclasses might
                         use different hashing method (and override checkhash() in such case)
                     flags - the known flags to set on the revision
                     deltacomputer - an optional deltacomputer instance shared between
                         multiple calls
                     sidedata - an optional mapping of sidedata to store with the
                         revision; only accepted by revlogs supporting sidedata
                     If the node is already stored, its existing revision number is
                     returned and nothing is written.
                     """
                     if link == nullrev:
                         msg = _(b"attempted to add linkrev -1 to %s") % self.display_id
                         raise error.RevlogError(msg)
                     if sidedata is None:
                         sidedata = {}
                     elif sidedata and not self.feature_config.has_side_data:
                         msg = _(b"trying to add sidedata to a revlog who don't support them")
                         raise error.ProgrammingError(msg)
                     # with flags set, the node is derived from the non-raw text
                     if flags and not node:
                         node = self.hash(text, p1, p2)
                     rawtext, validatehash = flagutil.processflagswrite(self, text, flags)
                     # A provided cachedelta no longer applies once the flag processor
                     # has altered the revision data.
                     if rawtext != text:
                         cachedelta = None
                     rawsize = len(rawtext)
                     if rawsize > _maxentrysize:
                         msg = _(
                             b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                         )
                         raise error.RevlogError(msg % (self.display_id, rawsize))
                     if not node:
                         node = self.hash(rawtext, p1, p2)
                     known_rev = self.index.get_rev(node)
                     if known_rev is not None:
                         return known_rev
                     if validatehash:
                         self.checkhash(rawtext, node, p1=p1, p2=p2)
                     return self.addrawrevision(
                         rawtext,
                         transaction,
                         link,
                         p1,
                         p2,
                         node,
                         flags,
                         cachedelta=cachedelta,
                         deltacomputer=deltacomputer,
                         sidedata=sidedata,
                     )
                 def addrawrevision(
                     self,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     node,
                     flags,
                     cachedelta=None,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """Add a raw revision whose flags, node and parents are already known.
                     Useful when reusing a revision not stored in this revlog (ex: received
                     over wire, or read from an external bundle). The write happens inside
                     a ``_writing`` context and the value of ``_addrevision`` is returned.
                     """
                     with self._writing(transaction):
                         new_rev = self._addrevision(
                             node,
                             rawtext,
                             transaction,
                             link,
                             p1,
                             p2,
                             flags,
                             cachedelta,
                             deltacomputer=deltacomputer,
                             sidedata=sidedata,
                         )
                         return new_rev
                 def compress(self, data):
                     """Return a ``(header, payload)`` pair for possibly-compressed data.
                     The header is ``b'u'`` when the data is stored uncompressed and needs
                     an explicit marker, and empty in every other case."""
                     if data:
                         compressed = self._compressor.compress(data)
                         if compressed:
                             # The revlog compressor added the header in the returned
                             # data.
                             return b'', compressed
                         if data[0:1] != b'\0':
                             return b'u', data
                     # empty data, or raw data that already starts with a NUL byte
                     return b'', data
                 def decompress(self, data):
                     """Return the decompressed content of a revlog chunk.
                     The chunk is expected to start with a header byte identifying its
                     format, which is used to route it to the matching decompressor.
                     """
                     if not data:
                         return data
                     # Revlogs are read far more often than they are written, and many
                     # chunks take only microseconds to decompress, so the dispatch
                     # below is ordered for speed. The working assumptions are:
                     #
                     # 1) most chunks are compressed (as opposed to inline raw data);
                     # 2) decompressing *any* data is likely at least 10x slower than
                     #    returning raw inline data;
                     # 3) common, officially supported compression engines come first.
                     #
                     # Hence the inline checks run before the generic compengines
                     # lookup. According to `hg perfrevlogchunks`, this is ~0.5% faster
                     # for zlib compressed chunks, which matters for changelog and
                     # manifest reads.
                     header = data[0:1]
                     if header == b'x':
                         try:
                             return _zlibdecompress(data)
                         except zlib.error as e:
                             msg = _(b'revlog decompress error: %s')
                             msg %= stringutil.forcebytestr(e)
                             raise error.RevlogError(msg)
                     # '\0' is more common than 'u' so it goes first.
                     if header == b'\0':
                         return data
                     if header == b'u':
                         return util.buffer(data, 1)
                     return self._get_decompressor(header).decompress(data)
                 def _addrevision(
                     self,
                     node,
                     rawtext,
                     transaction,
                     link,
                     p1,
                     p2,
                     flags,
                     cachedelta,
                     alwayscache=False,
                     deltacomputer=None,
                     sidedata=None,
                 ):
                     """internal function to add revisions to the log
                     see addrevision for argument descriptions.
                     note: "addrevision" takes non-raw text, "_addrevision" takes raw text.
                     if "deltacomputer" is not provided or None, a defaultdeltacomputer will
                     be used.
                     if "alwayscache" is true and no rawtext was provided, the text is
                     rebuilt from the delta so that it can be stored in the revision cache.
                     returns the revision number of the newly added revision.
                     raises RevlogError when asked to add the null or a wdir revision, and
                     ProgrammingError when called outside of a `revlog._writing` context.
                     invariants:
                     - rawtext is optional (can be None); if not set, cachedelta must be set.
                       if both are set, they must correspond to each other.
                     """
                     if node == self.nullid:
                         raise error.RevlogError(
                             _(b"%s: attempt to add null revision") % self.display_id
                         )
                     if (
                         node == self.nodeconstants.wdirid
                         or node in self.nodeconstants.wdirfilenodeids
                     ):
                         raise error.RevlogError(
                             _(b"%s: attempt to add wdir revision") % self.display_id
                         )
                     if self._writinghandles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     # single-item list: the text is read back from it after the delta
                     # search (see the end of this method)
                     btext = [rawtext]
                     curr = len(self)
                     prev = curr - 1
                     offset = self._get_data_offset(prev)
                     if self._concurrencychecker:
                         ifh, dfh, sdfh = self._writinghandles
                         # XXX no checking for the sidedata file
                         if self._inline:
                             # offset is "as if" it were in the .d file, so we need to add on
                             # the size of the entry metadata.
                             self._concurrencychecker(
                                 ifh, self._indexfile, offset + curr * self.index.entry_size
                             )
                         else:
                             # Entries in the .i are a consistent size.
                             self._concurrencychecker(
                                 ifh, self._indexfile, curr * self.index.entry_size
                             )
                             self._concurrencychecker(dfh, self._datafile, offset)
                     p1r, p2r = self.rev(p1), self.rev(p2)
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if rawtext is None:
                         # need rawtext size, before changed by flag processors, which is
                         # the non-raw size. use revlog explicitly to avoid filelog's extra
                         # logic that might remove metadata size.
                         textlen = mdiff.patchedsize(
                             revlog.size(self, cachedelta[0]), cachedelta[1]
                         )
                     else:
                         textlen = len(rawtext)
                     if deltacomputer is None:
                         write_debug = None
                         if self.delta_config.debug_delta:
                             write_debug = transaction._report
                         deltacomputer = deltautil.deltacomputer(
                             self, write_debug=write_debug
                         )
                     if cachedelta is not None and len(cachedelta) == 2:
                         # If the cached delta has no information about how it should be
                         # reused, add the default reuse instruction according to the
                         # revlog's configuration.
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse = DELTA_BASE_REUSE_NO
                         cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)
                     revinfo = revlogutils.revisioninfo(
                         node,
                         p1,
                         p2,
                         btext,
                         textlen,
                         cachedelta,
                         flags,
                     )
                     deltainfo = deltacomputer.finddeltainfo(revinfo)
                     compression_mode = COMP_MODE_INLINE
                     if self._docket is not None:
                         default_comp = self._docket.default_compression_header
                         r = deltautil.delta_compression(default_comp, deltainfo)
                         compression_mode, deltainfo = r
                     sidedata_compression_mode = COMP_MODE_INLINE
                     if sidedata and self.feature_config.has_side_data:
                         sidedata_compression_mode = COMP_MODE_PLAIN
                         serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
                         sidedata_offset = self._docket.sidedata_end
                         h, comp_sidedata = self.compress(serialized_sidedata)
                         # only keep the compressed form when it is really compressed
                         # and smaller than the plain serialization
                         if (
                             h != b'u'
                             and comp_sidedata[0:1] != b'\0'
                             and len(comp_sidedata) < len(serialized_sidedata)
                         ):
                             assert not h
                             if (
                                 comp_sidedata[0:1]
                                 == self._docket.default_compression_header
                             ):
                                 sidedata_compression_mode = COMP_MODE_DEFAULT
                                 serialized_sidedata = comp_sidedata
                             else:
                                 sidedata_compression_mode = COMP_MODE_INLINE
                                 serialized_sidedata = comp_sidedata
                     else:
                         serialized_sidedata = b""
                         # Don't store the offset if the sidedata is empty, that way
                         # we can easily detect empty sidedata and they will be no different
                         # than ones we manually add.
                         sidedata_offset = 0
                     rank = RANK_UNKNOWN
                     # rank computation is driven by the feature configuration, like
                     # the other ``feature_config`` switches used in this method
                     if self.feature_config.compute_rank:
                         if (p1r, p2r) == (nullrev, nullrev):
                             rank = 1
                         elif p1r != nullrev and p2r == nullrev:
                             rank = 1 + self.fast_rank(p1r)
                         elif p1r == nullrev and p2r != nullrev:
                             rank = 1 + self.fast_rank(p2r)
                         else:  # merge node
                             if rustdagop is not None and self.index.rust_ext_compat:
                                 rank = rustdagop.rank(self.index, p1r, p2r)
                             else:
                                 pmin, pmax = sorted((p1r, p2r))
                                 rank = 1 + self.fast_rank(pmax)
                                 rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))
                     e = revlogutils.entry(
                         flags=flags,
                         data_offset=offset,
                         data_compressed_length=deltainfo.deltalen,
                         data_uncompressed_length=textlen,
                         data_compression_mode=compression_mode,
                         data_delta_base=deltainfo.base,
                         link_rev=link,
                         parent_rev_1=p1r,
                         parent_rev_2=p2r,
                         node_id=node,
                         sidedata_offset=sidedata_offset,
                         sidedata_compressed_length=len(serialized_sidedata),
                         sidedata_compression_mode=sidedata_compression_mode,
                         rank=rank,
                     )
                     self.index.append(e)
                     entry = self.index.entry_binary(curr)
                     # without a docket, the very first entry carries the packed
                     # format header
                     if curr == 0 and self._docket is None:
                         header = self._format_flags | self._format_version
                         header = self.index.pack_header(header)
                         entry = header + entry
                     self._writeentry(
                         transaction,
                         entry,
                         deltainfo.data,
                         link,
                         offset,
                         serialized_sidedata,
                         sidedata_offset,
                     )
                     rawtext = btext[0]
                     if alwayscache and rawtext is None:
                         rawtext = deltacomputer.buildtext(revinfo)
                     if type(rawtext) == bytes:  # only accept immutable objects
                         self._revisioncache = (node, curr, rawtext)
                     self._chainbasecache[curr] = deltainfo.chainbase
                     return curr
                 def _get_data_offset(self, prev):
                     """Returns the current offset in the (in-transaction) data file.
                     Versions < 2 of the revlog can get this 0(1), revlog v2 needs a docket
                     file to store that information: since sidedata can be rewritten to the
                     end of the data file within a transaction, you can have cases where, for
                     example, rev `n` does not have sidedata while rev `n - 1` does, leading
                     to `n - 1`'s sidedata being written after `n`'s data.
                     TODO cache this in a docket file before getting out of experimental."""
                     if self._docket is None:
                         return self.end(prev)
                     else:
                         return self._docket.data_end
                 def _writeentry(
                     self, transaction, entry, data, link, offset, sidedata, sidedata_offset
                 ):
                     """Write one index entry and its data through the writing handles.
                     ``entry`` is the binary index entry, ``data`` a pair of byte strings
                     written one after the other, and ``sidedata`` the serialized
                     sidedata (possibly empty). ``offset`` and ``sidedata_offset`` are the
                     positions registered in ``transaction`` for the data and sidedata
                     files. ``link`` is not used here.
                     Raises ProgrammingError when called outside of a `revlog._writing`
                     context.
                     """
                     # Files opened in a+ mode have inconsistent behavior on various
                     # platforms. Windows requires that a file positioning call be made
                     # when the file handle transitions between reads and writes. See
                     # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
                     # platforms, Python or the platform itself can be buggy. Some versions
                     # of Solaris have been observed to not append at the end of the file
                     # if the file was seeked to before the end. See issue4943 for more.
                     #
                     # We work around this issue by inserting a seek() before writing.
                     # Note: This is likely not necessary on Python 3. However, because
                     # the file handle is reused for reads and may be seeked there, we need
                     # to be careful before changing this.
                     if self._writinghandles is None:
                         msg = b'adding revision outside `revlog._writing` context'
                         raise error.ProgrammingError(msg)
                     ifh, dfh, sdfh = self._writinghandles
                     # position every handle at its end-of-content before writing: the
                     # physical end of file without a docket, the docket's recorded end
                     # otherwise
                     if self._docket is None:
                         ifh.seek(0, os.SEEK_END)
                     else:
                         ifh.seek(self._docket.index_end, os.SEEK_SET)
                     if dfh:
                         if self._docket is None:
                             dfh.seek(0, os.SEEK_END)
                         else:
                             dfh.seek(self._docket.data_end, os.SEEK_SET)
                     if sdfh:
                         sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                     # the caller has already appended the entry to the index, so the
                     # revision being written is the last one
                     curr = len(self) - 1
                     if not self._inline:
                         # register the pre-write offsets in the transaction, then write
                         # data and sidedata before the index entry
                         transaction.add(self._datafile, offset)
                         if self._sidedatafile:
                             transaction.add(self._sidedatafile, sidedata_offset)
                         transaction.add(self._indexfile, curr * len(entry))
                         if data[0]:
                             dfh.write(data[0])
                         dfh.write(data[1])
                         if sidedata:
                             sdfh.write(sidedata)
                         ifh.write(entry)
                     else:
                         # inline: entries and data are interleaved in the index file,
                         # so the data offset is shifted by the size of the previous
                         # entries
                         offset += curr * self.index.entry_size
                         transaction.add(self._indexfile, offset)
                         ifh.write(entry)
                         ifh.write(data[0])
                         ifh.write(data[1])
                         assert not sidedata
                         # may convert the revlog to non-inline if it grew too large
                         self._enforceinlinesize(transaction)
                     if self._docket is not None:
                         # revlog-v2 always has 3 writing handles, help Pytype
                         wh1 = self._writinghandles[0]
                         wh2 = self._writinghandles[1]
                         wh3 = self._writinghandles[2]
                         assert wh1 is not None
                         assert wh2 is not None
                         assert wh3 is not None
                         # record the new end of each file in the docket
                         self._docket.index_end = wh1.tell()
                         self._docket.data_end = wh2.tell()
                         self._docket.sidedata_end = wh3.tell()
                     nodemaputil.setup_persistent_nodemap(transaction, self)
                 def addgroup(
                     self,
                     deltas,
                     linkmapper,
                     transaction,
                     alwayscache=False,
                     addrevisioncb=None,
                     duplicaterevisioncb=None,
                     debug_info=None,
                     delta_base_reuse_policy=None,
                 ):
                     """
                     add a delta group

                     given a set of deltas, add them to the revision log. the
                     first delta is against its parent, which should be in our
                     log, the rest are against the previous delta.

                     Each item of ``deltas`` is unpacked as an 8-tuple ``(node, p1, p2,
                     linknode, deltabase, delta, flags, sidedata)``. ``linkmapper`` is
                     called with ``linknode`` and its result is stored as the linkrev.

                     If ``addrevisioncb`` is defined, it will be called with arguments of
                     this revlog and the revision number that was added. If
                     ``duplicaterevisioncb`` is defined, it is called the same way for
                     every incoming node that is already present in the index.

                     When ``delta_base_reuse_policy`` is None, DELTA_BASE_REUSE_TRY is
                     used if both ``general_delta`` and ``lazy_delta_base`` are set in
                     the delta config, DELTA_BASE_REUSE_NO otherwise.

                     Raises ProgrammingError when called while another addgroup() is
                     running on this revlog, LookupError when a parent or the delta base
                     is not in the index, and CensoredBaseError when the base is censored
                     and the delta is not a single full-replacement patch.

                     Returns True if at least one item of ``deltas`` was processed
                     (stored or reported as duplicate), False if ``deltas`` was empty.
                     """
                     if self._adding_group:
                         raise error.ProgrammingError(b'cannot nest addgroup() calls')
                     # read the default delta-base reuse policy from revlog config if the
                     # group did not specify one.
                     if delta_base_reuse_policy is None:
                         if (
                             self.delta_config.general_delta
                             and self.delta_config.lazy_delta_base
                         ):
                             delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
                         else:
                             delta_base_reuse_policy = DELTA_BASE_REUSE_NO
                     # re-entrancy guard, cleared again in the ``finally`` clause below
                     self._adding_group = True
                     empty = True
                     try:
                         with self._writing(transaction):
                             write_debug = None
                             if self.delta_config.debug_delta:
                                 write_debug = transaction._report
                             # a single delta computer is shared by the whole group
                             deltacomputer = deltautil.deltacomputer(
                                 self,
                                 write_debug=write_debug,
                                 debug_info=debug_info,
                             )
                             # loop through our set of deltas
                             for data in deltas:
                                 (
                                     node,
                                     p1,
                                     p2,
                                     linknode,
                                     deltabase,
                                     delta,
                                     flags,
                                     sidedata,
                                 ) = data
                                 link = linkmapper(linknode)
                                 flags = flags or REVIDX_DEFAULT_FLAGS
                                 rev = self.index.get_rev(node)
                                 if rev is not None:
                                     # this can happen if two branches make the same change
                                     self._nodeduplicatecallback(transaction, rev)
                                     if duplicaterevisioncb:
                                         duplicaterevisioncb(self, rev)
                                     # a duplicate still counts as a processed item
                                     empty = False
                                     continue
                                 for p in (p1, p2):
                                     if not self.index.has_node(p):
                                         raise error.LookupError(
                                             p, self.radix, _(b'unknown parent')
                                         )
                                 if not self.index.has_node(deltabase):
                                     raise error.LookupError(
                                         deltabase, self.display_id, _(b'unknown delta base')
                                     )
                                 baserev = self.rev(deltabase)
                                 if baserev != nullrev and self.iscensored(baserev):
                                     # if base is censored, delta must be full replacement in a
                                     # single patch operation
                                     hlen = struct.calcsize(b">lll")
                                     oldlen = self.rawsize(baserev)
                                     newlen = len(delta) - hlen
                                     if delta[:hlen] != mdiff.replacediffheader(
                                         oldlen, newlen
                                     ):
                                         raise error.CensoredBaseError(
                                             self.display_id, self.node(baserev)
                                         )
                                 # only probe the delta for censorship when no flag is set
                                 if not flags and self._peek_iscensored(baserev, delta):
                                     flags |= REVIDX_ISCENSORED
                                 # We assume consumers of addrevisioncb will want to retrieve
                                 # the added revision, which will require a call to
                                 # revision(). revision() will fast path if there is a cache
                                 # hit. So, we tell _addrevision() to always cache in this case.
                                 # We're only using addgroup() in the context of changegroup
                                 # generation so the revision data can always be handled as raw
                                 # by the flagprocessor.
                                 rev = self._addrevision(
                                     node,
                                     None,
                                     transaction,
                                     link,
                                     p1,
                                     p2,
                                     flags,
                                     (baserev, delta, delta_base_reuse_policy),
                                     alwayscache=alwayscache,
                                     deltacomputer=deltacomputer,
                                     sidedata=sidedata,
                                 )
                                 if addrevisioncb:
                                     addrevisioncb(self, rev)
                                 empty = False
                     finally:
                         self._adding_group = False
                     return not empty
                 def iscensored(self, rev):
                     """Tell whether revision ``rev`` carries the censored flag.

                     Always False when the revlog is not configured as censorable;
                     otherwise the (truthy or zero) result of masking the revision
                     flags with REVIDX_ISCENSORED.
                     """
                     if self.feature_config.censorable:
                         return self.flags(rev) & REVIDX_ISCENSORED
                     return False
                 def _peek_iscensored(self, baserev, delta):
                     """Quickly check if a delta produces a censored revision."""
                     if not self.feature_config.censorable:
                         return False
                     return storageutil.deltaiscensored(delta, baserev, self.rawsize)
                 def getstrippoint(self, minlink):
                     """Compute where this revlog has to be cut to strip ``minlink``.

                     The work is delegated to ``storageutil.resolvestripinfo``; the
                     result is a tuple holding the minimum rev to strip and the set of
                     revs whose linkrevs will be broken by this strip.
                     """
                     tiprev = len(self) - 1
                     heads = self.headrevs()
                     return storageutil.resolvestripinfo(
                         minlink, tiprev, heads, self.linkrev, self.parentrevs
                     )
                 def strip(self, minlink, transaction):
                     """Drop every revision from the first one whose linkrev >= minlink.

                     Called when changelog revision ``minlink`` and its descendants are
                     being stripped from the repository. Since the surviving changelog
                     revisions get renumbered afterwards, everything stored from the
                     strip point on is truncated here; the caller is trusted to have
                     saved whatever must survive and to re-add it afterwards.
                     """
                     if not len(self):
                         return
                     cut_rev, _broken = self.getstrippoint(minlink)
                     if cut_rev == len(self):
                         # nothing at or after the strip point
                         return
                     # step 1: register the on-disk truncation offsets
                     data_end = self.start(cut_rev)
                     if self._inline:
                         # inline revlogs interleave index entries and data chunks
                         end = data_end + (cut_rev * self.index.entry_size)
                     else:
                         transaction.add(self._datafile, data_end)
                         end = cut_rev * self.index.entry_size
                     if self._sidedatafile:
                         sidedata_end = self.sidedata_cut_off(cut_rev)
                         transaction.add(self._sidedatafile, sidedata_end)
                     transaction.add(self._indexfile, end)
                     docket = self._docket
                     if docket is not None:
                         # XXX the docket could be leveraged while stripping, but it
                         # is not powerful enough for that yet
                         docket.index_end = end
                         docket.data_end = data_end
                         docket.sidedata_end = sidedata_end
                         docket.write(transaction, stripping=True)
                     # step 2: make the in-memory state forget the stripped revisions
                     self._revisioncache = None
                     self._chaininfocache = util.lrucachedict(500)
                     self._segmentfile.clear_cache()
                     self._segmentfile_sidedata.clear_cache()
                     del self.index[cut_rev:-1]
                 def checksize(self):
                     """Check size of index and data files

                     return a (dd, di) tuple.
                     - dd: extra bytes for the "data" file
                     - di: extra bytes for the "index" file

                     A healthy revlog will return (0, 0). A file that does not exist
                     (FileNotFoundError) is reported as having 0 extra bytes.
                     """
                     expected = 0
                     if len(self):
                         expected = max(0, self.end(len(self) - 1))
                     try:
                         with self._datafp() as f:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         dd = actual - expected
                     except FileNotFoundError:
                         dd = 0
                     try:
                         f = self.opener(self._indexfile)
                         try:
                             f.seek(0, io.SEEK_END)
                             actual = f.tell()
                         finally:
                             # release the handle even if seek()/tell() fails
                             f.close()
                         s = self.index.entry_size
                         # bytes left over after the last complete index entry
                         i = max(0, actual // s)
                         di = actual - (i * s)
                         if self._inline:
                             # inline revlogs keep the data inside the index file, so the
                             # whole discrepancy is reported against the index
                             databytes = sum(max(0, self.length(r)) for r in self)
                             dd = 0
                             di = actual - len(self) * s - databytes
                     except FileNotFoundError:
                         di = 0
                     return (dd, di)
                 def files(self):
                     """List the paths of the files backing this revlog.

                     Without a docket this is the index file plus, for non-inline
                     revlogs, the data file. With a docket it is the index file, the
                     docket file, the old index/data/sidedata files reported by the
                     docket, and the current data and sidedata files when their
                     recorded end offset is non-zero.
                     """
                     if self._docket_file is None:
                         paths = [self._indexfile]
                         if not self._inline:
                             paths.append(self._datafile)
                         return paths
                     docket = self._docket
                     paths = [self._indexfile, self._docket_file]
                     paths += docket.old_index_filepaths(include_empty=False)
                     if docket.data_end:
                         paths.append(self._datafile)
                     paths += docket.old_data_filepaths(include_empty=False)
                     if docket.sidedata_end:
                         paths.append(self._sidedatafile)
                     paths += docket.old_sidedata_filepaths(include_empty=False)
                     return paths
                 def emitrevisions(
                     self,
                     nodes,
                     nodesorder=None,
                     revisiondata=False,
                     assumehaveparentrevisions=False,
                     deltamode=repository.CG_DELTAMODE_STD,
                     sidedata_helpers=None,
                     debug_info=None,
                 ):
                     """Emit revision deltas for ``nodes`` via ``storageutil.emitrevisions``.

                     ``nodesorder`` must be b'nodes', b'storage', b'linear' or None,
                     otherwise ProgrammingError is raised. None becomes b'storage' when
                     the revlog is not general-delta. When delta chains are not stored,
                     any ``deltamode`` other than CG_DELTAMODE_PREV is replaced by
                     CG_DELTAMODE_FULL.
                     """
                     known_orders = (b'nodes', b'storage', b'linear', None)
                     if nodesorder not in known_orders:
                         raise error.ProgrammingError(
                             b'unhandled value for nodesorder: %s' % nodesorder
                         )
                     if nodesorder is None and not self.delta_config.general_delta:
                         nodesorder = b'storage'
                     if not (
                         self._storedeltachains
                         or deltamode == repository.CG_DELTAMODE_PREV
                     ):
                         deltamode = repository.CG_DELTAMODE_FULL
                     # revlog accessors handed to the generic emitter
                     accessors = dict(
                         deltaparentfn=self.deltaparent,
                         candeltafn=self._candelta,
                         rawsizefn=self.rawsize,
                         revdifffn=self.revdiff,
                         flagsfn=self.flags,
                     )
                     return storageutil.emitrevisions(
                         self,
                         nodes,
                         nodesorder,
                         revlogrevisiondelta,
                         deltamode=deltamode,
                         revisiondata=revisiondata,
                         assumehaveparentrevisions=assumehaveparentrevisions,
                         sidedata_helpers=sidedata_helpers,
                         debug_info=debug_info,
                         **accessors
                     )
                 # Delta reuse policies accepted by ``clone()``.
                 DELTAREUSEALWAYS = b'always'
                 DELTAREUSESAMEREVS = b'samerevs'
                 DELTAREUSENEVER = b'never'
                 DELTAREUSEFULLADD = b'fulladd'
                 # Every valid policy, used to validate the ``deltareuse`` argument.
                 DELTAREUSEALL = {
                     DELTAREUSEALWAYS,
                     DELTAREUSESAMEREVS,
                     DELTAREUSENEVER,
                     DELTAREUSEFULLADD,
                 }
                 def clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb=None,
                     deltareuse=DELTAREUSESAMEREVS,
                     forcedeltabothparents=None,
                     sidedata_helpers=None,
                 ):
                     """Copy this revlog into ``destrevlog``, possibly changing format.

                     The destination ends up with the same revisions and nodes, but is
                     not guaranteed to be bit-for-bit identical (delta encoding may
                     differ, for instance).

                     ``deltareuse`` selects how deltas stored in this revlog are carried
                     over to the destination:

                     DELTAREUSEALWAYS
                        Reuse deltas whenever possible, even when the destination would
                        have picked other revisions for the delta. Fastest mode.

                     DELTAREUSESAMEREVS
                        Reuse a delta only when the destination would pick the same
                        revisions for it. A balance between speed and optimization, and
                        the default: when converting a non-generaldelta revlog to a
                        generaldelta one, deltas get recomputed if the delta's parent
                        is not a parent of the revision.

                     DELTAREUSENEVER
                        Never reuse deltas. Slowest mode; useful to recompute all deltas
                        (e.g. after a change of the diff/delta algorithm).

                     DELTAREUSEFULLADD
                        Re-add every revision as if it were new content. Slower than
                        DELTAREUSEALWAYS but lets more mechanisms kick in, e.g. large
                        file detection and handling.

                     Delta computation can be slow, so the chosen policy can
                     significantly affect run time.

                     ``forcedeltabothparents`` controls whether deltas are computed
                     against both parents for merges; when it is falsy the
                     destination's current setting is kept.

                     See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
                     `sidedata_helpers`.

                     Raises ValueError for an unknown ``deltareuse`` value, a non-empty
                     destination, or filtered revisions on either side.
                     """
                     if deltareuse not in self.DELTAREUSEALL:
                         msg = _(b'value for deltareuse invalid: %s') % deltareuse
                         raise ValueError(msg)
                     if len(destrevlog):
                         raise ValueError(_(b'destination revlog is not empty'))
                     if getattr(self, 'filteredrevs', None):
                         raise ValueError(_(b'source revlog has filtered revisions'))
                     if getattr(destrevlog, 'filteredrevs', None):
                         raise ValueError(_(b'destination revlog has filtered revisions'))
                     # Work on a private copy of the destination's delta configuration
                     # and put the original back once the copy is finished.
                     saved_config = destrevlog.delta_config
                     scratch_config = saved_config.copy()
                     destrevlog.delta_config = scratch_config
                     try:
                         # policy -> (lazy_delta_base, lazy_delta); these two settings
                         # control whether a cached delta gets reused, if possible.
                         lazy_settings = {
                             self.DELTAREUSEALWAYS: (True, True),
                             self.DELTAREUSESAMEREVS: (False, True),
                             self.DELTAREUSENEVER: (False, False),
                         }
                         if deltareuse in lazy_settings:
                             lazy_base, lazy = lazy_settings[deltareuse]
                             scratch_config.lazy_delta_base = lazy_base
                             scratch_config.lazy_delta = lazy
                         scratch_config.delta_both_parents = (
                             forcedeltabothparents or saved_config.delta_both_parents
                         )
                         with self.reading():
                             self._clone(
                                 tr,
                                 destrevlog,
                                 addrevisioncb,
                                 deltareuse,
                                 forcedeltabothparents,
                                 sidedata_helpers,
                             )
                     finally:
                         destrevlog.delta_config = saved_config
                 def _clone(
                     self,
                     tr,
                     destrevlog,
                     addrevisioncb,
                     deltareuse,
                     forcedeltabothparents,
                     sidedata_helpers,
                 ):
                     """perform the core duty of `revlog.clone` after parameter processing

                     Every revision of this revlog is copied, in order, into
                     ``destrevlog``. With DELTAREUSEFULLADD the revision goes through
                     ``destrevlog.addrevision``; otherwise it is written with
                     ``destrevlog._addrevision``, handing over the stored delta as
                     ``cachedelta`` when the destination allows lazy deltas and the
                     revision has a delta parent.

                     When ``sidedata_helpers`` is given, the sidedata is run through
                     ``sidedatautil.run_sidedata_helpers`` and the flag masks it returns
                     are applied to the revision flags. ``addrevisioncb``, if set, is
                     called with ``(self, rev, node)`` after each revision.
                     ``forcedeltabothparents`` is accepted but not used here.
                     """
                     write_debug = None
                     if self.delta_config.debug_delta:
                         write_debug = tr._report
                     deltacomputer = deltautil.deltacomputer(
                         destrevlog,
                         write_debug=write_debug,
                     )
                     index = self.index
                     for rev in self:
                         entry = index[rev]
                         # Some classes override linkrev to take filtered revs into
                         # account. Use raw entry from index.
                         flags = entry[0] & 0xFFFF
                         linkrev = entry[4]
                         p1 = index[entry[5]][7]
                         p2 = index[entry[6]][7]
                         node = entry[7]
                         # (Possibly) reuse the delta from the revlog if allowed and
                         # the revlog chunk is a delta.
                         cachedelta = None
                         rawtext = None
                         if deltareuse == self.DELTAREUSEFULLADD:
                             text = self._revisiondata(rev)
                             sidedata = self.sidedata(rev)
                             if sidedata_helpers is not None:
                                 (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # ``&`` binds tighter than ``|``: the parentheses are
                                 # needed so that the second mask really clears bits of
                                 # ``flags`` (the pair is presumably
                                 # (flags_to_add, flags_to_remove) -- confirm against
                                 # run_sidedata_helpers).
                                 flags = (flags | new_flags[0]) & ~new_flags[1]
                             destrevlog.addrevision(
                                 text,
                                 tr,
                                 linkrev,
                                 p1,
                                 p2,
                                 cachedelta=cachedelta,
                                 node=node,
                                 flags=flags,
                                 deltacomputer=deltacomputer,
                                 sidedata=sidedata,
                             )
                         else:
                             if destrevlog._lazydelta:
                                 dp = self.deltaparent(rev)
                                 if dp != nullrev:
                                     cachedelta = (dp, bytes(self._chunk(rev)))
                             if not cachedelta:
                                 # no reusable delta: hand over the full raw text
                                 rawtext = self._revisiondata(rev)
                             sidedata = self.sidedata(rev)
                             if sidedata_helpers is not None:
                                 (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                                     self, sidedata_helpers, sidedata, rev
                                 )
                                 # see the FULLADD branch for why this is parenthesised
                                 flags = (flags | new_flags[0]) & ~new_flags[1]
                             with destrevlog._writing(tr):
                                 destrevlog._addrevision(
                                     node,
                                     rawtext,
                                     tr,
                                     linkrev,
                                     p1,
                                     p2,
                                     flags,
                                     cachedelta,
                                     deltacomputer=deltacomputer,
                                     sidedata=sidedata,
                                 )
                         if addrevisioncb:
                             addrevisioncb(self, rev, node)
                 def censorrevision(self, tr, censornode, tombstone=b''):
                     """Censor ``censornode``, leaving ``tombstone`` in its place.

                     Version 0 revlogs cannot be censored and raise RevlogError;
                     version 1 is handled by ``rewrite.v1_censor`` and every other
                     format version by ``rewrite.v2_censor``.
                     """
                     version = self._format_version
                     if version == REVLOGV0:
                         raise error.RevlogError(
                             _(b'cannot censor with version %d revlogs') % version
                         )
                     if version == REVLOGV1:
                         censor = rewrite.v1_censor
                     else:
                         censor = rewrite.v2_censor
                     censor(self, tr, censornode, tombstone)
                 def verifyintegrity(self, state):
                     """Verifies the integrity of the revlog.

                     Yields ``revlogproblem`` instances describing problems that are
                     found.

                     ``state`` is a dict shared with the caller. This method reads
                     ``b'expectedversion'``, ``b'erroroncensored'`` and the optional
                     ``b'skipflags'`` (defaults to 0), and it resets ``b'skipread'``
                     and ``b'safe_renamed'`` to empty sets before checking revisions.
                     Nodes whose content could not be unpacked are added to
                     ``state[b'skipread']``; censored nodes are added to it only when
                     ``state[b'erroroncensored']`` is set.
                     """
                     # file-level check: sizes of the index and data files
                     dd, di = self.checksize()
                     if dd:
                         yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
                     if di:
                         yield revlogproblem(error=_(b'index contains %d extra bytes') % di)
                     version = self._format_version
                     # The verifier tells us what version revlog we should be.
                     if version != state[b'expectedversion']:
                         yield revlogproblem(
                             warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                             % (self.display_id, version, state[b'expectedversion'])
                         )
                     state[b'skipread'] = set()
                     state[b'safe_renamed'] = set()
                     for rev in self:
                         node = self.node(rev)
                         # Verify contents. 4 cases to care about:
                         #
                         #   common: the most common case
                         #   rename: with a rename
                         #   meta: file content starts with b'\1\n', the metadata
                         #         header defined in filelog.py, but without a rename
                         #   ext: content stored externally
                         #
                         # More formally, their differences are shown below:
                         #
                         #                       | common | rename | meta  | ext
                         #  -------------------------------------------------------
                         #   flags()             | 0      | 0      | 0     | not 0
                         #   renamed()           | False  | True   | False | ?
                         #   rawtext[0:2]=='\1\n'| False  | True   | True  | ?
                         #
                         # "rawtext" means the raw text stored in revlog data, which
                         # could be retrieved by "rawdata(rev)". "text"
                         # mentioned below is "revision(rev)".
                         #
                         # There are 3 different lengths stored physically:
                         #  1. L1: rawsize, stored in revlog index
                         #  2. L2: len(rawtext), stored in revlog data
                         #  3. L3: len(text), stored in revlog data if flags==0, or
                         #     possibly somewhere else if flags!=0
                         #
                         # L1 should be equal to L2. L3 could be different from them.
                         # "text" may or may not affect commit hash depending on flag
                         # processors (see flagutil.addflagprocessor).
                         #
                         #              | common  | rename | meta  | ext
                         # -------------------------------------------------
                         #    rawsize() | L1      | L1     | L1    | L1
                         #       size() | L1      | L2-LM  | L1(*) | L1 (?)
                         # len(rawtext) | L2      | L2     | L2    | L2
                         #    len(text) | L2      | L2     | L2    | L3
                         #  len(read()) | L2      | L2-LM  | L2-LM | L3 (?)
                         #
                         # LM:  length of metadata, depending on rawtext
                         # (*): not ideal, see comment in filelog.size
                         # (?): could be "- len(meta)" if the resolved content has
                         #      rename metadata
                         #
                         # Checks needed to be done:
                         #  1. length check: L1 == L2, in all cases.
                         #  2. hash check: depending on flag processor, we may need to
                         #     use either "text" (external), or "rawtext" (in revlog).
                         try:
                             # keep only the skip flags that are set on this revision
                             skipflags = state.get(b'skipflags', 0)
                             if skipflags:
                                 skipflags &= self.flags(rev)
                             _verify_revision(self, skipflags, state, node)
                             # length check: L1 (index) against L2 (stored raw text)
                             l1 = self.rawsize(rev)
                             l2 = len(self.rawdata(node))
                             if l1 != l2:
                                 yield revlogproblem(
                                     error=_(b'unpacked size is %d, %d expected') % (l2, l1),
                                     node=node,
                                 )
                         except error.CensoredNodeError:
                             # censored data is a problem only if the caller asked for it
                             if state[b'erroroncensored']:
                                 yield revlogproblem(
                                     error=_(b'censored file data'), node=node
                                 )
                                 state[b'skipread'].add(node)
                         except Exception as e:
                             # any other failure is reported as a problem for this node
                             # and verification moves on to the next revision
                             yield revlogproblem(
                                 error=_(b'unpacking %s: %s')
                                 % (short(node), stringutil.forcebytestr(e)),
                                 node=node,
                             )
                             state[b'skipread'].add(node)
                 def storageinfo(
                     self,
                     exclusivefiles=False,
                     sharedfiles=False,
                     revisionscount=False,
                     trackedsize=False,
                     storedsize=False,
                 ):
                     """Collect the requested storage statistics in a dict.

                     Each truthy argument adds the bytes key of the same name:
                     ``exclusivefiles`` lists ``(opener, path)`` pairs for the index
                     file and, unless inline, the data file; ``sharedfiles`` is always
                     an empty list; ``revisionscount`` is ``len(self)``;
                     ``trackedsize`` sums ``rawsize`` over all revisions; and
                     ``storedsize`` sums the on-disk size of every path in ``files()``.
                     """
                     info = {}
                     if exclusivefiles:
                         owned = [(self.opener, self._indexfile)]
                         if not self._inline:
                             owned.append((self.opener, self._datafile))
                         info[b'exclusivefiles'] = owned
                     if sharedfiles:
                         info[b'sharedfiles'] = []
                     if revisionscount:
                         info[b'revisionscount'] = len(self)
                     if trackedsize:
                         info[b'trackedsize'] = sum(self.rawsize(r) for r in self)
                     if storedsize:
                         on_disk = 0
                         for path in self.files():
                             on_disk += self.opener.stat(path).st_size
                         info[b'storedsize'] = on_disk
                     return info
                 def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
                     """Generate and store sidedata for ``startrev`` to ``endrev``.

                     Both bounds are inclusive. ``helpers`` is passed unchanged to
                     ``sidedatautil.run_sidedata_helpers``. The call is a no-op when
                     the revlog has no sidedata support, or when both ``helpers[1]``
                     and ``helpers[2]`` are empty.

                     The serialized sidedata of each revision is appended to the
                     sidedata file (compressed when that makes it smaller), then the
                     index entries of the affected revisions are rewritten in place.

                     Raises ``error.Abort`` when a revision in the range has a
                     non-zero value in index entry field 8 or 9, i.e. it already
                     carries sidedata.
                     """
                     if not self.feature_config.has_side_data:
                         return
                     # revlog formats with sidedata support do not support inline
                     assert not self._inline
                     if not helpers[1] and not helpers[2]:
                         # Nothing to generate or remove
                         return

                     new_entries = []
                     # append the new sidedata
                     with self._writing(transaction):
                         ifh, _dfh, sdfh = self._writinghandles
                         # Position the *sidedata* handle at the end of the existing
                         # sidedata: this is the handle whose offset is recorded and
                         # written to below.
                         sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)

                         current_offset = sdfh.tell()
                         for rev in range(startrev, endrev + 1):
                             entry = self.index[rev]
                             new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                                 store=self,
                                 sidedata_helpers=helpers,
                                 sidedata={},
                                 rev=rev,
                             )

                             serialized_sidedata = sidedatautil.serialize_sidedata(
                                 new_sidedata
                             )

                             sidedata_compression_mode = COMP_MODE_INLINE
                             if serialized_sidedata and self.feature_config.has_side_data:
                                 sidedata_compression_mode = COMP_MODE_PLAIN
                                 h, comp_sidedata = self.compress(serialized_sidedata)
                                 # Slice rather than index: indexing a bytes object
                                 # yields an int, which never compares equal to a
                                 # bytes value.
                                 comp_header = comp_sidedata[0:1]
                                 if (
                                     h != b'u'
                                     and comp_header != b'\0'
                                     and len(comp_sidedata) < len(serialized_sidedata)
                                 ):
                                     assert not h
                                     # NOTE(review): assumes the docket stores the
                                     # default compression header as a 1-byte bytes
                                     # value -- confirm against the docket definition.
                                     if (
                                         comp_header
                                         == self._docket.default_compression_header
                                     ):
                                         sidedata_compression_mode = COMP_MODE_DEFAULT
                                     else:
                                         sidedata_compression_mode = COMP_MODE_INLINE
                                     serialized_sidedata = comp_sidedata
                             if entry[8] != 0 or entry[9] != 0:
                                 # rewriting entries that already have sidedata is not
                                 # supported yet, because it introduces garbage data in the
                                 # revlog.
                                 msg = b"rewriting existing sidedata is not supported yet"
                                 raise error.Abort(msg)

                             # Apply (potential) flags to add and to remove after running
                             # the sidedata helpers.
                             # NOTE(review): `&` binds tighter than `|`, so flags[1]
                             # only masks the flags being added; it never clears bits
                             # already set in entry[0]. Parentheses make the existing
                             # behavior explicit -- confirm this is the intent.
                             new_offset_flags = entry[0] | (flags[0] & ~flags[1])
                             entry_update = (
                                 current_offset,
                                 len(serialized_sidedata),
                                 new_offset_flags,
                                 sidedata_compression_mode,
                             )

                             # the sidedata computation might have moved the file
                             # cursors around
                             sdfh.seek(current_offset, os.SEEK_SET)
                             sdfh.write(serialized_sidedata)
                             new_entries.append(entry_update)
                             current_offset += len(serialized_sidedata)
                             self._docket.sidedata_end = sdfh.tell()

                         # rewrite the new index entries
                         ifh.seek(startrev * self.index.entry_size)
                         for i, e in enumerate(new_entries):
                             rev = startrev + i
                             self.index.replace_sidedata_info(rev, *e)
                             packed = self.index.entry_binary(rev)
                             if rev == 0 and self._docket is None:
                                 # the first index entry shares its bytes with the
                                 # packed revlog header
                                 header = self._format_flags | self._format_version
                                 header = self.index.pack_header(header)
                                 packed = header + packed
                             ifh.write(packed)